pixeltable 0.3.2__py3-none-any.whl → 0.3.4__py3-none-any.whl
This diff shows the changes between two publicly released versions of the package, as published to their public registries. It is provided for informational purposes only.
- pixeltable/__init__.py +64 -11
- pixeltable/__version__.py +2 -2
- pixeltable/catalog/__init__.py +1 -1
- pixeltable/catalog/catalog.py +50 -27
- pixeltable/catalog/column.py +27 -11
- pixeltable/catalog/dir.py +6 -4
- pixeltable/catalog/globals.py +8 -1
- pixeltable/catalog/insertable_table.py +22 -12
- pixeltable/catalog/named_function.py +10 -6
- pixeltable/catalog/path.py +3 -2
- pixeltable/catalog/path_dict.py +8 -6
- pixeltable/catalog/schema_object.py +2 -1
- pixeltable/catalog/table.py +121 -101
- pixeltable/catalog/table_version.py +291 -142
- pixeltable/catalog/table_version_path.py +8 -5
- pixeltable/catalog/view.py +67 -26
- pixeltable/dataframe.py +106 -81
- pixeltable/env.py +28 -24
- pixeltable/exec/__init__.py +2 -2
- pixeltable/exec/aggregation_node.py +10 -4
- pixeltable/exec/cache_prefetch_node.py +5 -3
- pixeltable/exec/component_iteration_node.py +9 -9
- pixeltable/exec/data_row_batch.py +21 -10
- pixeltable/exec/exec_context.py +10 -3
- pixeltable/exec/exec_node.py +23 -12
- pixeltable/exec/expr_eval/evaluators.py +13 -7
- pixeltable/exec/expr_eval/expr_eval_node.py +24 -15
- pixeltable/exec/expr_eval/globals.py +30 -7
- pixeltable/exec/expr_eval/row_buffer.py +5 -6
- pixeltable/exec/expr_eval/schedulers.py +151 -31
- pixeltable/exec/in_memory_data_node.py +8 -7
- pixeltable/exec/row_update_node.py +15 -5
- pixeltable/exec/sql_node.py +56 -27
- pixeltable/exprs/__init__.py +2 -2
- pixeltable/exprs/arithmetic_expr.py +57 -26
- pixeltable/exprs/array_slice.py +1 -1
- pixeltable/exprs/column_property_ref.py +2 -1
- pixeltable/exprs/column_ref.py +20 -15
- pixeltable/exprs/comparison.py +6 -2
- pixeltable/exprs/compound_predicate.py +1 -3
- pixeltable/exprs/data_row.py +2 -2
- pixeltable/exprs/expr.py +108 -72
- pixeltable/exprs/expr_dict.py +2 -1
- pixeltable/exprs/expr_set.py +3 -1
- pixeltable/exprs/function_call.py +39 -41
- pixeltable/exprs/globals.py +1 -0
- pixeltable/exprs/in_predicate.py +2 -2
- pixeltable/exprs/inline_expr.py +20 -17
- pixeltable/exprs/json_mapper.py +4 -2
- pixeltable/exprs/json_path.py +12 -18
- pixeltable/exprs/literal.py +5 -9
- pixeltable/exprs/method_ref.py +1 -0
- pixeltable/exprs/object_ref.py +1 -1
- pixeltable/exprs/row_builder.py +32 -17
- pixeltable/exprs/rowid_ref.py +14 -5
- pixeltable/exprs/similarity_expr.py +11 -6
- pixeltable/exprs/sql_element_cache.py +1 -1
- pixeltable/exprs/type_cast.py +24 -9
- pixeltable/ext/__init__.py +1 -0
- pixeltable/ext/functions/__init__.py +1 -0
- pixeltable/ext/functions/whisperx.py +2 -2
- pixeltable/ext/functions/yolox.py +11 -11
- pixeltable/func/aggregate_function.py +17 -13
- pixeltable/func/callable_function.py +6 -6
- pixeltable/func/expr_template_function.py +15 -14
- pixeltable/func/function.py +16 -16
- pixeltable/func/function_registry.py +11 -8
- pixeltable/func/globals.py +4 -2
- pixeltable/func/query_template_function.py +12 -13
- pixeltable/func/signature.py +18 -9
- pixeltable/func/tools.py +10 -17
- pixeltable/func/udf.py +106 -11
- pixeltable/functions/__init__.py +21 -2
- pixeltable/functions/anthropic.py +16 -12
- pixeltable/functions/fireworks.py +63 -5
- pixeltable/functions/gemini.py +13 -3
- pixeltable/functions/globals.py +18 -6
- pixeltable/functions/huggingface.py +20 -38
- pixeltable/functions/image.py +7 -3
- pixeltable/functions/json.py +1 -0
- pixeltable/functions/llama_cpp.py +1 -4
- pixeltable/functions/mistralai.py +31 -20
- pixeltable/functions/ollama.py +4 -18
- pixeltable/functions/openai.py +231 -113
- pixeltable/functions/replicate.py +11 -10
- pixeltable/functions/string.py +70 -7
- pixeltable/functions/timestamp.py +21 -8
- pixeltable/functions/together.py +66 -52
- pixeltable/functions/video.py +1 -0
- pixeltable/functions/vision.py +14 -11
- pixeltable/functions/whisper.py +2 -1
- pixeltable/globals.py +60 -26
- pixeltable/index/__init__.py +1 -1
- pixeltable/index/btree.py +5 -3
- pixeltable/index/embedding_index.py +15 -14
- pixeltable/io/__init__.py +1 -1
- pixeltable/io/external_store.py +30 -25
- pixeltable/io/fiftyone.py +6 -14
- pixeltable/io/globals.py +33 -27
- pixeltable/io/hf_datasets.py +2 -1
- pixeltable/io/label_studio.py +77 -68
- pixeltable/io/pandas.py +36 -23
- pixeltable/io/parquet.py +9 -12
- pixeltable/iterators/__init__.py +1 -0
- pixeltable/iterators/audio.py +205 -0
- pixeltable/iterators/document.py +19 -8
- pixeltable/iterators/image.py +6 -24
- pixeltable/iterators/string.py +3 -6
- pixeltable/iterators/video.py +1 -7
- pixeltable/metadata/__init__.py +7 -1
- pixeltable/metadata/converters/convert_10.py +2 -2
- pixeltable/metadata/converters/convert_15.py +1 -5
- pixeltable/metadata/converters/convert_16.py +2 -4
- pixeltable/metadata/converters/convert_17.py +2 -4
- pixeltable/metadata/converters/convert_18.py +2 -4
- pixeltable/metadata/converters/convert_19.py +2 -5
- pixeltable/metadata/converters/convert_20.py +1 -4
- pixeltable/metadata/converters/convert_21.py +4 -6
- pixeltable/metadata/converters/convert_22.py +1 -0
- pixeltable/metadata/converters/convert_23.py +5 -5
- pixeltable/metadata/converters/convert_24.py +12 -13
- pixeltable/metadata/converters/convert_26.py +23 -0
- pixeltable/metadata/converters/util.py +3 -4
- pixeltable/metadata/notes.py +1 -0
- pixeltable/metadata/schema.py +13 -2
- pixeltable/plan.py +173 -98
- pixeltable/share/__init__.py +0 -0
- pixeltable/share/packager.py +218 -0
- pixeltable/store.py +42 -26
- pixeltable/type_system.py +102 -75
- pixeltable/utils/arrow.py +7 -8
- pixeltable/utils/coco.py +16 -17
- pixeltable/utils/code.py +1 -1
- pixeltable/utils/console_output.py +6 -3
- pixeltable/utils/description_helper.py +7 -7
- pixeltable/utils/documents.py +3 -1
- pixeltable/utils/filecache.py +12 -7
- pixeltable/utils/http_server.py +9 -8
- pixeltable/utils/iceberg.py +14 -0
- pixeltable/utils/media_store.py +3 -2
- pixeltable/utils/pytorch.py +11 -14
- pixeltable/utils/s3.py +1 -0
- pixeltable/utils/sql.py +1 -0
- pixeltable/utils/transactional_directory.py +2 -2
- {pixeltable-0.3.2.dist-info → pixeltable-0.3.4.dist-info}/METADATA +9 -9
- pixeltable-0.3.4.dist-info/RECORD +166 -0
- pixeltable-0.3.2.dist-info/RECORD +0 -161
- {pixeltable-0.3.2.dist-info → pixeltable-0.3.4.dist-info}/LICENSE +0 -0
- {pixeltable-0.3.2.dist-info → pixeltable-0.3.4.dist-info}/WHEEL +0 -0
- {pixeltable-0.3.2.dist-info → pixeltable-0.3.4.dist-info}/entry_points.txt +0 -0
--- a/pixeltable/exec/expr_eval/expr_eval_node.py
+++ b/pixeltable/exec/expr_eval/expr_eval_node.py
@@ -4,24 +4,23 @@ import asyncio
 import logging
 import traceback
 from types import TracebackType
-from typing import
+from typing import AsyncIterator, Iterable, Optional, Union
 
 import numpy as np
 
 import pixeltable.exceptions as excs
-from pixeltable import exprs
-
+from pixeltable import exprs, func
+
+from ..data_row_batch import DataRowBatch
+from ..exec_node import ExecNode
 from .evaluators import DefaultExprEvaluator, FnCallEvaluator
 from .globals import Evaluator, Scheduler
 from .row_buffer import RowBuffer
 from .schedulers import SCHEDULERS
-from ..data_row_batch import DataRowBatch
-from ..exec_node import ExecNode
 
 _logger = logging.getLogger('pixeltable')
 
 
-
 class ExprEvalNode(ExecNode):
     """
     Expression evaluation
@@ -35,10 +34,13 @@ class ExprEvalNode(ExecNode):
     TODO:
     - Literal handling: currently, Literal values are copied into slots via the normal evaluation mechanism, which is
       needless overhead; instead: pre-populate Literal slots in _init_row()
+    - dynamically determine MAX_BUFFERED_ROWS, based on the avg memory consumption of a row and our configured memory
+      limit
     - local model inference on gpu: currently, no attempt is made to ensure that models can fit onto the gpu
       simultaneously, which will cause errors; instead, the execution should be divided into sequential phases, each
       of which only contains a subset of the models which is known to fit onto the gpu simultaneously
     """
+
     maintain_input_order: bool  # True if we're returning rows in the order we received them from our input
     num_dependencies: np.ndarray  # number of dependencies for our output slots; indexed by slot idx
     outputs: np.ndarray  # bool per slot; True if this slot is part of our output
@@ -68,11 +70,15 @@ class ExprEvalNode(ExecNode):
     num_output_rows: int
 
     BATCH_SIZE = 64
-    MAX_BUFFERED_ROWS =
+    MAX_BUFFERED_ROWS = 2048  # maximum number of rows that have been dispatched but not yet returned
 
     def __init__(
-        self,
-
+        self,
+        row_builder: exprs.RowBuilder,
+        output_exprs: Iterable[exprs.Expr],
+        input_exprs: Iterable[exprs.Expr],
+        input: ExecNode,
+        maintain_input_order: bool = True,
     ):
         super().__init__(row_builder, output_exprs, input_exprs, input)
         self.maintain_input_order = maintain_input_order
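MAX_BUFFERED_ROWS caps the number of rows that have been dispatched to evaluators but not yet returned, which acts as backpressure on the input side. A minimal sketch of that idea, with hypothetical dispatch/collect callables standing in for the node's internals (not Pixeltable's API):

MAX_BUFFERED_ROWS = 2048  # cap on dispatched-but-unreturned rows


async def run(input_batches, dispatch, collect):
    # hypothetical driver loop: stop pulling input once too many rows are in flight
    in_flight = 0
    async for batch in input_batches:
        while in_flight + len(batch) > MAX_BUFFERED_ROWS:
            in_flight -= await collect()  # wait for some in-flight rows to complete
        dispatch(batch)
        in_flight += len(batch)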
@@ -148,7 +154,9 @@ class ExprEvalNode(ExecNode):
                 self.row_pos_map[id(row)] = self.num_input_rows + idx
             self.num_input_rows += len(batch)
             self.avail_input_rows += len(batch)
-            _logger.debug(
+            _logger.debug(
+                f'adding input: batch_size={len(batch)} #input_rows={self.num_input_rows} #avail={self.avail_input_rows}'
+            )
         except StopAsyncIteration:
             self.input_complete = True
             _logger.debug(f'finished input: #input_rows={self.num_input_rows}, #avail={self.avail_input_rows}')
@@ -175,11 +183,11 @@ class ExprEvalNode(ExecNode):
         rows: list[exprs.DataRow]
         if avail_current_batch_rows > num_rows:
             # we only need rows from current_input_batch
-            rows = self.current_input_batch.rows[self.input_row_idx:self.input_row_idx + num_rows]
+            rows = self.current_input_batch.rows[self.input_row_idx : self.input_row_idx + num_rows]
             self.input_row_idx += num_rows
         else:
             # we need rows from both current_/next_input_batch
-            rows = self.current_input_batch.rows[self.input_row_idx:]
+            rows = self.current_input_batch.rows[self.input_row_idx :]
             self.current_input_batch = self.next_input_batch
             self.next_input_batch = None
             self.input_row_idx = 0
@@ -236,6 +244,7 @@ class ExprEvalNode(ExecNode):
         exc_event_aw = asyncio.create_task(self.exc_event.wait(), name='exc_event.wait()')
         input_batch_aw: Optional[asyncio.Task] = None
         completed_aw: Optional[asyncio.Task] = None
+        closed_evaluators = False  # True after calling Evaluator.close()
 
         try:
             while True:
@@ -275,11 +284,12 @@ class ExprEvalNode(ExecNode):
                     assert self.output_buffer.num_rows == 0
                     return
 
-                if self.input_complete and self.avail_input_rows == 0:
+                if self.input_complete and self.avail_input_rows == 0 and not closed_evaluators:
                     # no more input rows to dispatch, but we're still waiting for rows to finish:
                     # close all slot evaluators to flush queued rows
                     for evaluator in self.slot_evaluators.values():
                         evaluator.close()
+                    closed_evaluators = True
 
                 # we don't have a full batch of rows at this point and need to wait
                 aws = {exc_event_aw}  # always wait for an exception
@@ -335,8 +345,7 @@ class ExprEvalNode(ExecNode):
         first_row = rows[0]
         input_vals = [first_row[idx] for idx in dependency_idxs]
         e = self.row_builder.unique_exprs[slot_with_exc]
-        self.error = excs.ExprEvalError(
-            e, f'expression {e}', first_row.get_exc(e.slot_idx), exc_tb, input_vals, 0)
+        self.error = excs.ExprEvalError(e, f'expression {e}', first_row.get_exc(e.slot_idx), exc_tb, input_vals, 0)
         self.exc_event.set()
         return
 
--- a/pixeltable/exec/expr_eval/globals.py
+++ b/pixeltable/exec/expr_eval/globals.py
@@ -1,16 +1,18 @@
+from __future__ import annotations
+
 import abc
 import asyncio
 from dataclasses import dataclass
 from types import TracebackType
-from typing import Any,
+from typing import Any, Optional, Protocol
 
-from pixeltable import exprs
-from pixeltable import func
+from pixeltable import exprs, func
 
 
 @dataclass
 class FnCallArgs:
     """Container for everything needed to execute a FunctionCall against one or more DataRows"""
+
     fn_call: exprs.FunctionCall
     rows: list[exprs.DataRow]
     # single call
@@ -37,16 +39,36 @@ class FnCallArgs:
 
 class Scheduler(abc.ABC):
     """
-    Base class for schedulers. A scheduler executes FunctionCalls against a limited resource pool.
+    Base class for queueing schedulers. A scheduler executes FunctionCalls against a limited resource pool.
 
     Expected behavior:
     - all created tasks must be recorded in dispatcher.tasks
     - schedulers are responsible for aborting execution when a) the task is cancelled or b) when an exception occurred
       elsewhere (indicated by dispatcher.exc_event)
     """
-
+
+    @dataclass(frozen=True)
+    class QueueItem:
+        """Container of work items for queueing schedulers"""
+
+        request: FnCallArgs
+        num_retries: int
+
+        def __lt__(self, other: Scheduler.QueueItem) -> bool:
+            # prioritize by number of retries (more retries = higher priority)
+            return self.num_retries > other.num_retries
+
+    resource_pool: str
+    queue: asyncio.PriorityQueue[QueueItem]  # prioritizes retries
+    dispatcher: Dispatcher
+
+    def __init__(self, resource_pool: str, dispatcher: Dispatcher):
+        self.resource_pool = resource_pool
+        self.queue = asyncio.PriorityQueue()
+        self.dispatcher = dispatcher
+
     def submit(self, item: FnCallArgs) -> None:
-
+        self.queue.put_nowait(self.QueueItem(item, 0))
 
     @classmethod
     @abc.abstractmethod
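Because asyncio.PriorityQueue pops the smallest item first, QueueItem inverts __lt__ so that a higher retry count compares as "smaller" and is therefore dequeued first. A self-contained sketch of that ordering trick (the Item class here is illustrative, not Pixeltable's):

import asyncio
from dataclasses import dataclass


@dataclass(frozen=True)
class Item:
    payload: str
    num_retries: int

    def __lt__(self, other: 'Item') -> bool:
        # inverted comparison: more retries -> "smaller" -> popped first
        return self.num_retries > other.num_retries


async def demo() -> None:
    q: asyncio.PriorityQueue[Item] = asyncio.PriorityQueue()
    q.put_nowait(Item('fresh', 0))
    q.put_nowait(Item('retried twice', 2))
    q.put_nowait(Item('retried once', 1))
    print((await q.get()).payload)  # prints 'retried twice'


asyncio.run(demo())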
@@ -63,6 +85,7 @@ class Dispatcher(Protocol):
     Exceptions: evaluators/schedulers need to check exc_event prior to starting long-running (non-interruptible)
     computations
     """
+
     row_builder: exprs.RowBuilder
     exc_event: asyncio.Event
     schedulers: dict[str, Scheduler]  # key: resource pool id
@@ -90,6 +113,7 @@ class Evaluator(abc.ABC):
     - evaluators are responsible for aborting execution when a) the task is cancelled or b) when an exception occurred
       elsewhere (indicated by dispatcher.exc_event)
     """
+
     dispatcher: Dispatcher
     is_closed: bool
 
@@ -110,4 +134,3 @@ class Evaluator(abc.ABC):
         """Indicates that there may not be any more rows getting scheduled"""
         self.is_closed = True
         self._close()
-
--- a/pixeltable/exec/expr_eval/row_buffer.py
+++ b/pixeltable/exec/expr_eval/row_buffer.py
@@ -62,15 +62,14 @@ class RowBuffer:
             return []
         rows: list[exprs.DataRow]
         if self.head_idx + n <= self.size:
-            rows = self.buffer[self.head_idx:self.head_idx + n].tolist()
-            self.buffer[self.head_idx:self.head_idx + n] = None
+            rows = self.buffer[self.head_idx : self.head_idx + n].tolist()
+            self.buffer[self.head_idx : self.head_idx + n] = None
         else:
-            rows = np.concatenate([self.buffer[self.head_idx:], self.buffer[:self.head_idx + n - self.size]]).tolist()
-            self.buffer[self.head_idx:] = None
-            self.buffer[:self.head_idx + n - self.size] = None
+            rows = np.concatenate([self.buffer[self.head_idx :], self.buffer[: self.head_idx + n - self.size]]).tolist()
+            self.buffer[self.head_idx :] = None
+            self.buffer[: self.head_idx + n - self.size] = None
         self.head_pos += n
         self.head_idx = (self.head_idx + n) % self.size
         self.num_rows -= n
         self.num_ready -= n
         return rows
-
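RowBuffer treats a fixed-size numpy object array as a ring: a read of n rows is either one contiguous slice or, when it wraps past the end of the array, the array's tail concatenated with its head. A standalone sketch of just that indexing, with toy values and none of RowBuffer's readiness bookkeeping:

import numpy as np

size = 8
buffer = np.array([f'row{i}' for i in range(size)], dtype=object)
head_idx, n = 6, 4  # take 4 items starting at index 6: wraps around

if head_idx + n <= size:
    taken = buffer[head_idx : head_idx + n].tolist()
else:
    # two slices: the tail of the array, then the wrapped-around prefix
    taken = np.concatenate([buffer[head_idx:], buffer[: head_idx + n - size]]).tolist()
print(taken)  # ['row6', 'row7', 'row0', 'row1']
head_idx = (head_idx + n) % size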
--- a/pixeltable/exec/expr_eval/schedulers.py
+++ b/pixeltable/exec/expr_eval/schedulers.py
@@ -5,12 +5,12 @@ import datetime
 import inspect
 import logging
 import sys
-
-from typing import
+import time
+from typing import Awaitable, Collection, Optional
 
-from pixeltable import env
-
-from .globals import
+from pixeltable import env, func
+
+from .globals import Dispatcher, FnCallArgs, Scheduler
 
 _logger = logging.getLogger('pixeltable')
 
@@ -29,19 +29,7 @@ class RateLimitsScheduler(Scheduler):
     TODO:
     - limit the number of in-flight requests based on the open file limit
     """
-
-    class QueueItem:
-        request: FnCallArgs
-        num_retries: int
-
-        def __lt__(self, other: RateLimitsScheduler.QueueItem) -> bool:
-            # prioritize by number of retries
-            return self.num_retries > other.num_retries
-
-    resource_pool: str
-    queue: asyncio.PriorityQueue[QueueItem]  # prioritizes retries
-    loop_task: asyncio.Task
-    dispatcher: Dispatcher
+
     get_request_resources_param_names: list[str]  # names of parameters of RateLimitsInfo.get_request_resources()
 
     # scheduling-related state
@@ -58,11 +46,9 @@ class RateLimitsScheduler(Scheduler):
     MAX_RETRIES = 10
 
     def __init__(self, resource_pool: str, dispatcher: Dispatcher):
-
-
-        self.dispatcher
-        self.loop_task = asyncio.create_task(self._main_loop())
-        self.dispatcher.register_task(self.loop_task)
+        super().__init__(resource_pool, dispatcher)
+        loop_task = asyncio.create_task(self._main_loop())
+        self.dispatcher.register_task(loop_task)
         self.pool_info = None  # initialized in _main_loop by the first request
         self.est_usage = {}
         self.num_in_flight = 0
@@ -104,6 +90,7 @@ class RateLimitsScheduler(Scheduler):
                 # wait for a single request to get rate limits
                 _logger.debug(f'initializing rate limits for {self.resource_pool}')
                 await self._exec(item.request, item.num_retries, is_task=False)
+                _logger.debug(f'initialized rate limits for {self.resource_pool}')
                 item = None
                 # if this was the first request, it created the pool_info
                 if self.pool_info is None:
@@ -111,6 +98,7 @@ class RateLimitsScheduler(Scheduler):
                     continue
 
             # check rate limits
+            _logger.debug(f'checking rate limits for {self.resource_pool}')
             request_resources = self._get_request_resources(item.request)
             limits_info = self._check_resource_limits(request_resources)
             aws: list[Awaitable[None]] = []
@@ -169,7 +157,6 @@ class RateLimitsScheduler(Scheduler):
         constant_kwargs, batch_kwargs = request.pxt_fn.create_batch_kwargs(batch_kwargs)
         return self.pool_info.get_request_resources(**constant_kwargs, **batch_kwargs)
 
-
     def _check_resource_limits(self, request_resources: dict[str, int]) -> Optional[env.RateLimitInfo]:
         """Returns the most depleted resource, relative to its limit, or None if all resources are within limits"""
         candidates: list[tuple[env.RateLimitInfo, float]] = []  # (info, relative usage)
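The "most depleted resource" check compares each resource's usage relative to its limit and returns the worst offender. A toy version of that selection, using plain dicts instead of env.RateLimitInfo and an assumed 95% threshold (both the signature and the threshold are illustrative, not Pixeltable's):

from typing import Optional


def most_depleted(usage: dict[str, int], limits: dict[str, int], threshold: float = 0.95) -> Optional[str]:
    # compute relative usage per resource and pick the maximum;
    # return None if everything is comfortably within its limit
    candidates = [(name, usage[name] / limits[name]) for name in limits]
    name, rel_usage = max(candidates, key=lambda t: t[1])
    return name if rel_usage >= threshold else None


assert most_depleted({'requests': 59, 'tokens': 500}, {'requests': 60, 'tokens': 10000}) == 'requests'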
@@ -191,7 +178,9 @@ class RateLimitsScheduler(Scheduler):
             start_ts = datetime.datetime.now(tz=datetime.timezone.utc)
             pxt_fn = request.fn_call.fn
             assert isinstance(pxt_fn, func.CallableFunction)
-            _logger.debug(
+            _logger.debug(
+                f'scheduler {self.resource_pool}: start evaluating slot {request.fn_call.slot_idx}, batch_size={len(request.rows)}'
+            )
             self.total_requests += 1
             if request.is_batched:
                 batch_result = await pxt_fn.aexec_batch(*request.batch_args, **request.batch_kwargs)
@@ -202,7 +191,9 @@ class RateLimitsScheduler(Scheduler):
                 result = await pxt_fn.aexec(*request.args, **request.kwargs)
                 request.row[request.fn_call.slot_idx] = result
             end_ts = datetime.datetime.now(tz=datetime.timezone.utc)
-            _logger.debug(
+            _logger.debug(
+                f'scheduler {self.resource_pool}: evaluated slot {request.fn_call.slot_idx} in {end_ts - start_ts}, batch_size={len(request.rows)}'
+            )
 
             # purge accumulated usage estimate, now that we have a new report
             self.est_usage = {r: 0 for r in self._resources}
@@ -210,10 +201,11 @@ class RateLimitsScheduler(Scheduler):
             self.dispatcher.dispatch(request.rows)
         except Exception as exc:
             _logger.debug(f'scheduler {self.resource_pool}: exception in slot {request.fn_call.slot_idx}: {exc}')
-            if
+            if self.pool_info is None:
                 # our pool info should be available at this point
                 self._set_pool_info()
-
+            assert self.pool_info is not None
+            if num_retries < self.MAX_RETRIES:
                 retry_delay = self.pool_info.get_retry_delay(exc)
                 if retry_delay is not None:
                     self.total_retried += 1
@@ -229,12 +221,140 @@ class RateLimitsScheduler(Scheduler):
                 row.set_exc(request.fn_call.slot_idx, exc)
             self.dispatcher.dispatch_exc(request.rows, request.fn_call.slot_idx, exc_tb)
         finally:
-            _logger.debug(
-                f'Scheduler stats: #requests={self.total_requests}, #retried={self.total_retried}')
+            _logger.debug(f'Scheduler stats: #requests={self.total_requests}, #retried={self.total_retried}')
             if is_task:
                 self.num_in_flight -= 1
                 self.request_completed.set()
 
 
+class RequestRateScheduler(Scheduler):
+    """
+    Scheduler for FunctionCalls with a fixed request rate limit and no runtime resource usage reports.
+
+    Rate limits are supplied in the config, in one of two ways:
+    - resource_pool='request-rate:<endpoint>':
+      * a single rate limit for all calls against that endpoint
+      * in the config: section '<endpoint>', key 'rate_limit'
+    - resource_pool='request-rate:<endpoint>:<model>':
+      * a single rate limit for all calls against that model
+      * in the config: section '<endpoint>.rate_limits', key '<model>'
+    - if no rate limit is found in the config, uses a default of 600 RPM
+
+    TODO:
+    - adaptive rate limiting based on 429 errors
+    """
+
+    secs_per_request: float  # inverted rate limit
+    num_in_flight: int
+    total_requests: int
+    total_retried: int
+
+    TIME_FORMAT = '%H:%M.%S %f'
+    MAX_RETRIES = 10
+    DEFAULT_RATE_LIMIT = 600  # requests per minute
+
+    def __init__(self, resource_pool: str, dispatcher: Dispatcher):
+        super().__init__(resource_pool, dispatcher)
+        loop_task = asyncio.create_task(self._main_loop())
+        self.dispatcher.register_task(loop_task)
+        self.num_in_flight = 0
+        self.total_requests = 0
+        self.total_retried = 0
+
+        # try to get the rate limit from the config
+        elems = resource_pool.split(':')
+        section: str
+        key: str
+        if len(elems) == 2:
+            # resource_pool: request-rate:endpoint
+            _, endpoint = elems
+            section = endpoint
+            key = 'rate_limit'
+        else:
+            # resource_pool: request-rate:endpoint:model
+            assert len(elems) == 3
+            _, endpoint, model = elems
+            section = f'{endpoint}.rate_limits'
+            key = model
+        requests_per_min = env.Env.get().config.get_int_value(key, section=section)
+        requests_per_min = requests_per_min or self.DEFAULT_RATE_LIMIT
+        self.secs_per_request = 1 / (requests_per_min / 60)
+
+    @classmethod
+    def matches(cls, resource_pool: str) -> bool:
+        return resource_pool.startswith('request-rate:')
+
+    async def _main_loop(self) -> None:
+        last_request_ts = 0.0
+        while True:
+            item = await self.queue.get()
+            if item.num_retries > 0:
+                self.total_retried += 1
+            now = time.monotonic()
+            if now - last_request_ts < self.secs_per_request:
+                wait_duration = self.secs_per_request - (now - last_request_ts)
+                _logger.debug(f'waiting for {wait_duration} for {self.resource_pool}')
+                await asyncio.sleep(wait_duration)
+
+            last_request_ts = time.monotonic()
+            if item.num_retries > 0:
+                # the last request encountered some problem: retry it synchronously, to wait for the problem to pass
+                _logger.debug(f'retrying request for {self.resource_pool}: #retries={item.num_retries}')
+                await self._exec(item.request, item.num_retries, is_task=False)
+                _logger.debug(f'retried request for {self.resource_pool}: #retries={item.num_retries}')
+            else:
+                _logger.debug(f'creating task for {self.resource_pool}')
+                self.num_in_flight += 1
+                task = asyncio.create_task(self._exec(item.request, item.num_retries, is_task=True))
+                self.dispatcher.register_task(task)
+
+    async def _exec(self, request: FnCallArgs, num_retries: int, is_task: bool) -> None:
+        assert all(not row.has_val[request.fn_call.slot_idx] for row in request.rows)
+        assert all(not row.has_exc(request.fn_call.slot_idx) for row in request.rows)
+
+        try:
+            start_ts = datetime.datetime.now(tz=datetime.timezone.utc)
+            pxt_fn = request.fn_call.fn
+            assert isinstance(pxt_fn, func.CallableFunction)
+            _logger.debug(
+                f'scheduler {self.resource_pool}: start evaluating slot {request.fn_call.slot_idx}, batch_size={len(request.rows)}'
+            )
+            self.total_requests += 1
+            if request.is_batched:
+                batch_result = await pxt_fn.aexec_batch(*request.batch_args, **request.batch_kwargs)
+                assert len(batch_result) == len(request.rows)
+                for row, result in zip(request.rows, batch_result):
+                    row[request.fn_call.slot_idx] = result
+            else:
+                result = await pxt_fn.aexec(*request.args, **request.kwargs)
+                request.row[request.fn_call.slot_idx] = result
+            end_ts = datetime.datetime.now(tz=datetime.timezone.utc)
+            _logger.debug(
+                f'scheduler {self.resource_pool}: evaluated slot {request.fn_call.slot_idx} in {end_ts - start_ts}, batch_size={len(request.rows)}'
+            )
+            self.dispatcher.dispatch(request.rows)
+
+        except Exception as exc:
+            # TODO: which exception can be retried?
+            _logger.debug(f'exception for {self.resource_pool}: {exc}')
+            status = getattr(exc, 'status', None)
+            _logger.debug(f'type={type(exc)} has_status={hasattr(exc, "status")} status={status}')
+            if num_retries < self.MAX_RETRIES:
+                self.queue.put_nowait(self.QueueItem(request, num_retries + 1))
+                return
+
+            # record the exception
+            _, _, exc_tb = sys.exc_info()
+            for row in request.rows:
+                row.set_exc(request.fn_call.slot_idx, exc)
+            self.dispatcher.dispatch_exc(request.rows, request.fn_call.slot_idx, exc_tb)
+        finally:
+            _logger.debug(
+                f'Scheduler stats: #in-flight={self.num_in_flight} #requests={self.total_requests}, #retried={self.total_retried}'
+            )
+            if is_task:
+                self.num_in_flight -= 1
+
+
 # all concrete Scheduler subclasses that implement matches()
-SCHEDULERS = [RateLimitsScheduler]
+SCHEDULERS = [RateLimitsScheduler, RequestRateScheduler]
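RequestRateScheduler paces requests on the monotonic clock: with secs_per_request = 1 / (rpm / 60), the default of 600 RPM works out to one request every 0.1s. A runnable sketch of just the pacing loop (print stands in for issuing a request; not Pixeltable's API):

import asyncio
import time


async def paced_requests(requests_per_min: float = 600.0) -> None:
    # space successive requests at least secs_per_request apart
    secs_per_request = 1 / (requests_per_min / 60)  # 600 RPM -> 0.1s
    last_request_ts = 0.0
    for i in range(3):
        now = time.monotonic()
        if now - last_request_ts < secs_per_request:
            await asyncio.sleep(secs_per_request - (now - last_request_ts))
        last_request_ts = time.monotonic()
        print(f'request {i} at {last_request_ts:.3f}')


asyncio.run(paced_requests())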
--- a/pixeltable/exec/in_memory_data_node.py
+++ b/pixeltable/exec/in_memory_data_node.py
@@ -1,5 +1,5 @@
 import logging
-from typing import Any, Iterator, Optional
+from typing import Any, AsyncIterator, Iterator, Optional
 
 import pixeltable.catalog as catalog
 import pixeltable.exprs as exprs
@@ -10,6 +10,7 @@ from .exec_node import ExecNode
 
 _logger = logging.getLogger('pixeltable')
 
+
 class InMemoryDataNode(ExecNode):
     """
     Outputs in-memory data as a DataRowBatch of a particular table.
@@ -18,6 +19,7 @@ class InMemoryDataNode(ExecNode):
     - with the values provided in the input rows
     - if an input row doesn't provide a value, sets the slot to the column default
     """
+
     tbl: catalog.TableVersion
     input_rows: list[dict[str, Any]]
     start_row_id: int
@@ -27,8 +29,7 @@ class InMemoryDataNode(ExecNode):
     output_exprs: list[exprs.ColumnRef]
 
     def __init__(
-        self, tbl: catalog.TableVersion, rows: list[dict[str, Any]],
-        row_builder: exprs.RowBuilder, start_row_id: int,
+        self, tbl: catalog.TableVersion, rows: list[dict[str, Any]], row_builder: exprs.RowBuilder, start_row_id: int
     ):
         # we materialize the input slots
         output_exprs = list(row_builder.input_exprs)
@@ -43,11 +44,11 @@ class InMemoryDataNode(ExecNode):
         """Create row batch and populate with self.input_rows"""
         user_cols_by_name = {
             col_ref.col.name: exprs.ColumnSlotIdx(col_ref.col, col_ref.slot_idx)
-            for col_ref in self.output_exprs
+            for col_ref in self.output_exprs
+            if col_ref.col.name is not None
         }
         output_cols_by_idx = {
-            col_ref.slot_idx: exprs.ColumnSlotIdx(col_ref.col, col_ref.slot_idx)
-            for col_ref in self.output_exprs
+            col_ref.slot_idx: exprs.ColumnSlotIdx(col_ref.col, col_ref.slot_idx) for col_ref in self.output_exprs
         }
         output_slot_idxs = {e.slot_idx for e in self.output_exprs}
 
@@ -68,7 +69,7 @@ class InMemoryDataNode(ExecNode):
                 input_slot_idxs.add(col_info.slot_idx)
 
             # set the remaining output slots to their default values (presently None)
-            missing_slot_idxs =
+            missing_slot_idxs = output_slot_idxs - input_slot_idxs
             for slot_idx in missing_slot_idxs:
                 col_info = output_cols_by_idx.get(slot_idx)
                 assert col_info is not None
--- a/pixeltable/exec/row_update_node.py
+++ b/pixeltable/exec/row_update_node.py
@@ -4,11 +4,13 @@ from typing import Any, AsyncIterator
 import pixeltable.catalog as catalog
 import pixeltable.exprs as exprs
 from pixeltable.utils.media_store import MediaStore
+
 from .data_row_batch import DataRowBatch
 from .exec_node import ExecNode
 
 _logger = logging.getLogger('pixeltable')
 
+
 class RowUpdateNode(ExecNode):
     """
     Update individual rows in the input batches, identified by key columns.
@@ -17,9 +19,15 @@ class RowUpdateNode(ExecNode):
     The node assumes that all update dicts contain the same keys, and it populates the slots of the columns present in
     the update list.
     """
+
     def __init__(
-
-
+        self,
+        tbl: catalog.TableVersionPath,
+        key_vals_batch: list[tuple],
+        is_rowid_key: bool,
+        col_vals_batch: list[dict[catalog.Column, Any]],
+        row_builder: exprs.RowBuilder,
+        input: ExecNode,
     ):
         super().__init__(row_builder, [], [], input)
         self.updates = {key_vals: col_vals for key_vals, col_vals in zip(key_vals_batch, col_vals_batch)}
@@ -28,7 +36,8 @@ class RowUpdateNode(ExecNode):
         # retrieve ColumnRefs from the RowBuilder (has slot_idx set)
         all_col_slot_idxs = {
             col_ref.col: col_ref.slot_idx
-            for col_ref in row_builder.unique_exprs
+            for col_ref in row_builder.unique_exprs
+            if isinstance(col_ref, exprs.ColumnRef)
         }
         self.col_slot_idxs = {col: all_col_slot_idxs[col] for col in col_vals_batch[0].keys()}
         self.key_slot_idxs = {col: all_col_slot_idxs[col] for col in tbl.tbl_version.primary_key_columns()}
@@ -37,8 +46,9 @@ class RowUpdateNode(ExecNode):
     async def __aiter__(self) -> AsyncIterator[DataRowBatch]:
         async for batch in self.input:
             for row in batch:
-                key_vals =
-                    tuple(row[slot_idx] for slot_idx in self.key_slot_idxs.values())
+                key_vals = (
+                    row.rowid if self.is_rowid_key else tuple(row[slot_idx] for slot_idx in self.key_slot_idxs.values())
+                )
                 if key_vals not in self.updates:
                     continue
                 self.matched_key_vals.add(key_vals)