pixeltable 0.2.26__py3-none-any.whl → 0.5.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (245)
  1. pixeltable/__init__.py +83 -19
  2. pixeltable/_query.py +1444 -0
  3. pixeltable/_version.py +1 -0
  4. pixeltable/catalog/__init__.py +7 -4
  5. pixeltable/catalog/catalog.py +2394 -119
  6. pixeltable/catalog/column.py +225 -104
  7. pixeltable/catalog/dir.py +38 -9
  8. pixeltable/catalog/globals.py +53 -34
  9. pixeltable/catalog/insertable_table.py +265 -115
  10. pixeltable/catalog/path.py +80 -17
  11. pixeltable/catalog/schema_object.py +28 -43
  12. pixeltable/catalog/table.py +1270 -677
  13. pixeltable/catalog/table_metadata.py +103 -0
  14. pixeltable/catalog/table_version.py +1270 -751
  15. pixeltable/catalog/table_version_handle.py +109 -0
  16. pixeltable/catalog/table_version_path.py +137 -42
  17. pixeltable/catalog/tbl_ops.py +53 -0
  18. pixeltable/catalog/update_status.py +191 -0
  19. pixeltable/catalog/view.py +251 -134
  20. pixeltable/config.py +215 -0
  21. pixeltable/env.py +736 -285
  22. pixeltable/exceptions.py +26 -2
  23. pixeltable/exec/__init__.py +7 -2
  24. pixeltable/exec/aggregation_node.py +39 -21
  25. pixeltable/exec/cache_prefetch_node.py +87 -109
  26. pixeltable/exec/cell_materialization_node.py +268 -0
  27. pixeltable/exec/cell_reconstruction_node.py +168 -0
  28. pixeltable/exec/component_iteration_node.py +25 -28
  29. pixeltable/exec/data_row_batch.py +11 -46
  30. pixeltable/exec/exec_context.py +26 -11
  31. pixeltable/exec/exec_node.py +35 -27
  32. pixeltable/exec/expr_eval/__init__.py +3 -0
  33. pixeltable/exec/expr_eval/evaluators.py +365 -0
  34. pixeltable/exec/expr_eval/expr_eval_node.py +413 -0
  35. pixeltable/exec/expr_eval/globals.py +200 -0
  36. pixeltable/exec/expr_eval/row_buffer.py +74 -0
  37. pixeltable/exec/expr_eval/schedulers.py +413 -0
  38. pixeltable/exec/globals.py +35 -0
  39. pixeltable/exec/in_memory_data_node.py +35 -27
  40. pixeltable/exec/object_store_save_node.py +293 -0
  41. pixeltable/exec/row_update_node.py +44 -29
  42. pixeltable/exec/sql_node.py +414 -115
  43. pixeltable/exprs/__init__.py +8 -5
  44. pixeltable/exprs/arithmetic_expr.py +79 -45
  45. pixeltable/exprs/array_slice.py +5 -5
  46. pixeltable/exprs/column_property_ref.py +40 -26
  47. pixeltable/exprs/column_ref.py +254 -61
  48. pixeltable/exprs/comparison.py +14 -9
  49. pixeltable/exprs/compound_predicate.py +9 -10
  50. pixeltable/exprs/data_row.py +213 -72
  51. pixeltable/exprs/expr.py +270 -104
  52. pixeltable/exprs/expr_dict.py +6 -5
  53. pixeltable/exprs/expr_set.py +20 -11
  54. pixeltable/exprs/function_call.py +383 -284
  55. pixeltable/exprs/globals.py +18 -5
  56. pixeltable/exprs/in_predicate.py +7 -7
  57. pixeltable/exprs/inline_expr.py +37 -37
  58. pixeltable/exprs/is_null.py +8 -4
  59. pixeltable/exprs/json_mapper.py +120 -54
  60. pixeltable/exprs/json_path.py +90 -60
  61. pixeltable/exprs/literal.py +61 -16
  62. pixeltable/exprs/method_ref.py +7 -6
  63. pixeltable/exprs/object_ref.py +19 -8
  64. pixeltable/exprs/row_builder.py +238 -75
  65. pixeltable/exprs/rowid_ref.py +53 -15
  66. pixeltable/exprs/similarity_expr.py +65 -50
  67. pixeltable/exprs/sql_element_cache.py +5 -5
  68. pixeltable/exprs/string_op.py +107 -0
  69. pixeltable/exprs/type_cast.py +25 -13
  70. pixeltable/exprs/variable.py +2 -2
  71. pixeltable/func/__init__.py +9 -5
  72. pixeltable/func/aggregate_function.py +197 -92
  73. pixeltable/func/callable_function.py +119 -35
  74. pixeltable/func/expr_template_function.py +101 -48
  75. pixeltable/func/function.py +375 -62
  76. pixeltable/func/function_registry.py +20 -19
  77. pixeltable/func/globals.py +6 -5
  78. pixeltable/func/mcp.py +74 -0
  79. pixeltable/func/query_template_function.py +151 -35
  80. pixeltable/func/signature.py +178 -49
  81. pixeltable/func/tools.py +164 -0
  82. pixeltable/func/udf.py +176 -53
  83. pixeltable/functions/__init__.py +44 -4
  84. pixeltable/functions/anthropic.py +226 -47
  85. pixeltable/functions/audio.py +148 -11
  86. pixeltable/functions/bedrock.py +137 -0
  87. pixeltable/functions/date.py +188 -0
  88. pixeltable/functions/deepseek.py +113 -0
  89. pixeltable/functions/document.py +81 -0
  90. pixeltable/functions/fal.py +76 -0
  91. pixeltable/functions/fireworks.py +72 -20
  92. pixeltable/functions/gemini.py +249 -0
  93. pixeltable/functions/globals.py +208 -53
  94. pixeltable/functions/groq.py +108 -0
  95. pixeltable/functions/huggingface.py +1088 -95
  96. pixeltable/functions/image.py +155 -84
  97. pixeltable/functions/json.py +8 -11
  98. pixeltable/functions/llama_cpp.py +31 -19
  99. pixeltable/functions/math.py +169 -0
  100. pixeltable/functions/mistralai.py +50 -75
  101. pixeltable/functions/net.py +70 -0
  102. pixeltable/functions/ollama.py +29 -36
  103. pixeltable/functions/openai.py +548 -160
  104. pixeltable/functions/openrouter.py +143 -0
  105. pixeltable/functions/replicate.py +15 -14
  106. pixeltable/functions/reve.py +250 -0
  107. pixeltable/functions/string.py +310 -85
  108. pixeltable/functions/timestamp.py +37 -19
  109. pixeltable/functions/together.py +77 -120
  110. pixeltable/functions/twelvelabs.py +188 -0
  111. pixeltable/functions/util.py +7 -2
  112. pixeltable/functions/uuid.py +30 -0
  113. pixeltable/functions/video.py +1528 -117
  114. pixeltable/functions/vision.py +26 -26
  115. pixeltable/functions/voyageai.py +289 -0
  116. pixeltable/functions/whisper.py +19 -10
  117. pixeltable/functions/whisperx.py +179 -0
  118. pixeltable/functions/yolox.py +112 -0
  119. pixeltable/globals.py +716 -236
  120. pixeltable/index/__init__.py +3 -1
  121. pixeltable/index/base.py +17 -21
  122. pixeltable/index/btree.py +32 -22
  123. pixeltable/index/embedding_index.py +155 -92
  124. pixeltable/io/__init__.py +12 -7
  125. pixeltable/io/datarows.py +140 -0
  126. pixeltable/io/external_store.py +83 -125
  127. pixeltable/io/fiftyone.py +24 -33
  128. pixeltable/io/globals.py +47 -182
  129. pixeltable/io/hf_datasets.py +96 -127
  130. pixeltable/io/label_studio.py +171 -156
  131. pixeltable/io/lancedb.py +3 -0
  132. pixeltable/io/pandas.py +136 -115
  133. pixeltable/io/parquet.py +40 -153
  134. pixeltable/io/table_data_conduit.py +702 -0
  135. pixeltable/io/utils.py +100 -0
  136. pixeltable/iterators/__init__.py +8 -4
  137. pixeltable/iterators/audio.py +207 -0
  138. pixeltable/iterators/base.py +9 -3
  139. pixeltable/iterators/document.py +144 -87
  140. pixeltable/iterators/image.py +17 -38
  141. pixeltable/iterators/string.py +15 -12
  142. pixeltable/iterators/video.py +523 -127
  143. pixeltable/metadata/__init__.py +33 -8
  144. pixeltable/metadata/converters/convert_10.py +2 -3
  145. pixeltable/metadata/converters/convert_13.py +2 -2
  146. pixeltable/metadata/converters/convert_15.py +15 -11
  147. pixeltable/metadata/converters/convert_16.py +4 -5
  148. pixeltable/metadata/converters/convert_17.py +4 -5
  149. pixeltable/metadata/converters/convert_18.py +4 -6
  150. pixeltable/metadata/converters/convert_19.py +6 -9
  151. pixeltable/metadata/converters/convert_20.py +3 -6
  152. pixeltable/metadata/converters/convert_21.py +6 -8
  153. pixeltable/metadata/converters/convert_22.py +3 -2
  154. pixeltable/metadata/converters/convert_23.py +33 -0
  155. pixeltable/metadata/converters/convert_24.py +55 -0
  156. pixeltable/metadata/converters/convert_25.py +19 -0
  157. pixeltable/metadata/converters/convert_26.py +23 -0
  158. pixeltable/metadata/converters/convert_27.py +29 -0
  159. pixeltable/metadata/converters/convert_28.py +13 -0
  160. pixeltable/metadata/converters/convert_29.py +110 -0
  161. pixeltable/metadata/converters/convert_30.py +63 -0
  162. pixeltable/metadata/converters/convert_31.py +11 -0
  163. pixeltable/metadata/converters/convert_32.py +15 -0
  164. pixeltable/metadata/converters/convert_33.py +17 -0
  165. pixeltable/metadata/converters/convert_34.py +21 -0
  166. pixeltable/metadata/converters/convert_35.py +9 -0
  167. pixeltable/metadata/converters/convert_36.py +38 -0
  168. pixeltable/metadata/converters/convert_37.py +15 -0
  169. pixeltable/metadata/converters/convert_38.py +39 -0
  170. pixeltable/metadata/converters/convert_39.py +124 -0
  171. pixeltable/metadata/converters/convert_40.py +73 -0
  172. pixeltable/metadata/converters/convert_41.py +12 -0
  173. pixeltable/metadata/converters/convert_42.py +9 -0
  174. pixeltable/metadata/converters/convert_43.py +44 -0
  175. pixeltable/metadata/converters/util.py +44 -18
  176. pixeltable/metadata/notes.py +21 -0
  177. pixeltable/metadata/schema.py +185 -42
  178. pixeltable/metadata/utils.py +74 -0
  179. pixeltable/mypy/__init__.py +3 -0
  180. pixeltable/mypy/mypy_plugin.py +123 -0
  181. pixeltable/plan.py +616 -225
  182. pixeltable/share/__init__.py +3 -0
  183. pixeltable/share/packager.py +797 -0
  184. pixeltable/share/protocol/__init__.py +33 -0
  185. pixeltable/share/protocol/common.py +165 -0
  186. pixeltable/share/protocol/operation_types.py +33 -0
  187. pixeltable/share/protocol/replica.py +119 -0
  188. pixeltable/share/publish.py +349 -0
  189. pixeltable/store.py +398 -232
  190. pixeltable/type_system.py +730 -267
  191. pixeltable/utils/__init__.py +40 -0
  192. pixeltable/utils/arrow.py +201 -29
  193. pixeltable/utils/av.py +298 -0
  194. pixeltable/utils/azure_store.py +346 -0
  195. pixeltable/utils/coco.py +26 -27
  196. pixeltable/utils/code.py +4 -4
  197. pixeltable/utils/console_output.py +46 -0
  198. pixeltable/utils/coroutine.py +24 -0
  199. pixeltable/utils/dbms.py +92 -0
  200. pixeltable/utils/description_helper.py +11 -12
  201. pixeltable/utils/documents.py +60 -61
  202. pixeltable/utils/exception_handler.py +36 -0
  203. pixeltable/utils/filecache.py +38 -22
  204. pixeltable/utils/formatter.py +88 -51
  205. pixeltable/utils/gcs_store.py +295 -0
  206. pixeltable/utils/http.py +133 -0
  207. pixeltable/utils/http_server.py +14 -13
  208. pixeltable/utils/iceberg.py +13 -0
  209. pixeltable/utils/image.py +17 -0
  210. pixeltable/utils/lancedb.py +90 -0
  211. pixeltable/utils/local_store.py +322 -0
  212. pixeltable/utils/misc.py +5 -0
  213. pixeltable/utils/object_stores.py +573 -0
  214. pixeltable/utils/pydantic.py +60 -0
  215. pixeltable/utils/pytorch.py +20 -20
  216. pixeltable/utils/s3_store.py +527 -0
  217. pixeltable/utils/sql.py +32 -5
  218. pixeltable/utils/system.py +30 -0
  219. pixeltable/utils/transactional_directory.py +4 -3
  220. pixeltable-0.5.7.dist-info/METADATA +579 -0
  221. pixeltable-0.5.7.dist-info/RECORD +227 -0
  222. {pixeltable-0.2.26.dist-info → pixeltable-0.5.7.dist-info}/WHEEL +1 -1
  223. pixeltable-0.5.7.dist-info/entry_points.txt +2 -0
  224. pixeltable/__version__.py +0 -3
  225. pixeltable/catalog/named_function.py +0 -36
  226. pixeltable/catalog/path_dict.py +0 -141
  227. pixeltable/dataframe.py +0 -894
  228. pixeltable/exec/expr_eval_node.py +0 -232
  229. pixeltable/ext/__init__.py +0 -14
  230. pixeltable/ext/functions/__init__.py +0 -8
  231. pixeltable/ext/functions/whisperx.py +0 -77
  232. pixeltable/ext/functions/yolox.py +0 -157
  233. pixeltable/tool/create_test_db_dump.py +0 -311
  234. pixeltable/tool/create_test_video.py +0 -81
  235. pixeltable/tool/doc_plugins/griffe.py +0 -50
  236. pixeltable/tool/doc_plugins/mkdocstrings.py +0 -6
  237. pixeltable/tool/doc_plugins/templates/material/udf.html.jinja +0 -135
  238. pixeltable/tool/embed_udf.py +0 -9
  239. pixeltable/tool/mypy_plugin.py +0 -55
  240. pixeltable/utils/media_store.py +0 -76
  241. pixeltable/utils/s3.py +0 -16
  242. pixeltable-0.2.26.dist-info/METADATA +0 -400
  243. pixeltable-0.2.26.dist-info/RECORD +0 -156
  244. pixeltable-0.2.26.dist-info/entry_points.txt +0 -3
  245. {pixeltable-0.2.26.dist-info → pixeltable-0.5.7.dist-info/licenses}/LICENSE +0 -0
@@ -1,49 +1,253 @@
1
1
  """
2
- Pixeltable [UDFs](https://pixeltable.readme.io/docs/user-defined-functions-udfs)
2
+ Pixeltable UDFs
3
3
  that wrap various endpoints from the OpenAI API. In order to use them, you must
4
4
  first `pip install openai` and configure your OpenAI credentials, as described in
5
- the [Working with OpenAI](https://pixeltable.readme.io/docs/working-with-openai) tutorial.
5
+ the [Working with OpenAI](https://docs.pixeltable.com/notebooks/integrations/working-with-openai) tutorial.
6
6
  """
7
7
 
8
8
  import base64
9
+ import datetime
9
10
  import io
11
+ import json
12
+ import logging
13
+ import math
10
14
  import pathlib
11
- import uuid
12
- from typing import TYPE_CHECKING, Callable, Optional, TypeVar, Union
15
+ import re
16
+ from typing import TYPE_CHECKING, Any, Callable, Type
13
17
 
18
+ import httpx
14
19
  import numpy as np
15
- import PIL.Image
16
- import tenacity
20
+ import PIL
17
21
 
18
22
  import pixeltable as pxt
19
- from pixeltable import env
20
- from pixeltable.func import Batch
23
+ from pixeltable import env, exprs, type_system as ts
24
+ from pixeltable.config import Config
25
+ from pixeltable.func import Batch, Tools
21
26
  from pixeltable.utils.code import local_public_names
27
+ from pixeltable.utils.local_store import TempStore
28
+ from pixeltable.utils.system import set_file_descriptor_limit
22
29
 
23
30
  if TYPE_CHECKING:
24
31
  import openai
25
32
 
33
+ _logger = logging.getLogger('pixeltable')
34
+
26
35
 
27
36
  @env.register_client('openai')
28
- def _(api_key: str) -> 'openai.OpenAI':
37
+ def _(api_key: str, base_url: str | None = None, api_version: str | None = None) -> 'openai.AsyncOpenAI':
29
38
  import openai
30
- return openai.OpenAI(api_key=api_key)
39
+
40
+ max_connections = Config.get().get_int_value('openai.max_connections') or 2000
41
+ max_keepalive_connections = Config.get().get_int_value('openai.max_keepalive_connections') or 100
42
+ set_file_descriptor_limit(max_connections * 2)
43
+ default_query = None if api_version is None else {'api-version': api_version}
44
+
45
+ # Pixeltable scheduler's retry logic takes into account the rate limit-related response headers, so in theory we can
46
+ # benefit from disabling retries in the OpenAI client (max_retries=0). However to do that, we need to get smarter
47
+ # about idempotency keys and possibly more.
48
+ return openai.AsyncOpenAI(
49
+ api_key=api_key,
50
+ base_url=base_url,
51
+ default_query=default_query,
52
+ # recommended to increase limits for async client to avoid connection errors
53
+ http_client=httpx.AsyncClient(
54
+ limits=httpx.Limits(max_keepalive_connections=max_keepalive_connections, max_connections=max_connections),
55
+ # HTTP1 tends to perform better on this kind of workloads
56
+ http2=False,
57
+ http1=True,
58
+ ),
59
+ )
31
60
 
32
61
 
33
- def _openai_client() -> 'openai.OpenAI':
62
+ def _openai_client() -> 'openai.AsyncOpenAI':
34
63
  return env.Env.get().get_client('openai')
35
64
 
36
65
 
37
- # Exponential backoff decorator using tenacity.
38
- # TODO(aaron-siegel): Right now this hardwires random exponential backoff with defaults suggested
39
- # by OpenAI. Should we investigate making this more customizable in the future?
40
- def _retry(fn: Callable) -> Callable:
41
- import openai
42
- return tenacity.retry(
43
- retry=tenacity.retry_if_exception_type(openai.RateLimitError),
44
- wait=tenacity.wait_random_exponential(multiplier=1, max=60),
45
- stop=tenacity.stop_after_attempt(20),
46
- )(fn)
66
+ # models that share rate limits; see https://platform.openai.com/settings/organization/limits for details
67
+ _shared_rate_limits = {
68
+ 'gpt-4-turbo': [
69
+ 'gpt-4-turbo',
70
+ 'gpt-4-turbo-latest',
71
+ 'gpt-4-turbo-2024-04-09',
72
+ 'gpt-4-turbo-preview',
73
+ 'gpt-4-0125-preview',
74
+ 'gpt-4-1106-preview',
75
+ ],
76
+ 'gpt-4o': [
77
+ 'gpt-4o',
78
+ 'gpt-4o-latest',
79
+ 'gpt-4o-2024-05-13',
80
+ 'gpt-4o-2024-08-06',
81
+ 'gpt-4o-2024-11-20',
82
+ 'gpt-4o-audio-preview',
83
+ 'gpt-4o-audio-preview-2024-10-01',
84
+ 'gpt-4o-audio-preview-2024-12-17',
85
+ ],
86
+ 'gpt-4o-mini': [
87
+ 'gpt-4o-mini',
88
+ 'gpt-4o-mini-latest',
89
+ 'gpt-4o-mini-2024-07-18',
90
+ 'gpt-4o-mini-audio-preview',
91
+ 'gpt-4o-mini-audio-preview-2024-12-17',
92
+ ],
93
+ 'gpt-4o-mini-realtime-preview': [
94
+ 'gpt-4o-mini-realtime-preview',
95
+ 'gpt-4o-mini-realtime-preview-latest',
96
+ 'gpt-4o-mini-realtime-preview-2024-12-17',
97
+ ],
98
+ }
99
+
100
+
101
+ def _rate_limits_pool(model: str) -> str:
102
+ for model_family, models in _shared_rate_limits.items():
103
+ if model in models:
104
+ return f'rate-limits:openai:{model_family}'
105
+ return f'rate-limits:openai:{model}'
106
+
107
+
108
+ def _parse_header_duration(duration_str: str) -> float | None:
109
+ """Parses the value of x-ratelimit-reset-* header into seconds.
110
+
111
+ Returns None if the input cannot be parsed.
112
+
113
+ Real life examples of header values:
114
+ * '1m33.792s'
115
+ * '857ms'
116
+ * '0s'
117
+ * '47.874s'
118
+ * '156h58m48.601s'
119
+ """
120
+ if duration_str is None or duration_str.strip() == '':
121
+ return None
122
+ units = {
123
+ 86400: r'(\d+)d', # days
124
+ 3600: r'(\d+)h', # hours
125
+ 60: r'(\d+)m(?:[^s]|$)', # minutes
126
+ 1: r'([\d.]+)s', # seconds
127
+ 0.001: r'(\d+)ms', # millis
128
+ }
129
+ seconds = None
130
+ for unit_value, pattern in units.items():
131
+ match = re.search(pattern, duration_str)
132
+ if match:
133
+ seconds = seconds or 0.0
134
+ seconds += float(match.group(1)) * unit_value
135
+ _logger.debug(f'Parsed duration header value "{duration_str}" into {seconds} seconds')
136
+ return seconds
137
+
138
+
139
+ def _get_header_info(
140
+ headers: httpx.Headers,
141
+ ) -> tuple[tuple[int, int, datetime.datetime] | None, tuple[int, int, datetime.datetime] | None]:
142
+ """Parses rate limit related headers"""
143
+ # Requests and project-requests are two separate limits of requests per minute. project-requests headers will be
144
+ # present if an RPM limit is configured on the project limit.
145
+ requests_info = _get_resource_info(headers, 'requests')
146
+ requests_fraction_remaining = _fract_remaining(requests_info)
147
+ project_requests_info = _get_resource_info(headers, 'project-requests')
148
+ project_requests_fraction_remaining = _fract_remaining(project_requests_info)
149
+
150
+ # If both limit infos are present, pick the one with the least percentage remaining
151
+ best_requests_info = requests_info or project_requests_info
152
+ if (
153
+ requests_fraction_remaining is not None
154
+ and project_requests_fraction_remaining is not None
155
+ and project_requests_fraction_remaining < requests_fraction_remaining
156
+ ):
157
+ best_requests_info = project_requests_info
158
+
159
+ # Same story with tokens
160
+ tokens_info = _get_resource_info(headers, 'tokens')
161
+ tokens_fraction_remaining = _fract_remaining(tokens_info)
162
+ project_tokens_info = _get_resource_info(headers, 'project-tokens')
163
+ project_tokens_fraction_remaining = _fract_remaining(project_tokens_info)
164
+
165
+ best_tokens_info = tokens_info or project_tokens_info
166
+ if (
167
+ tokens_fraction_remaining is not None
168
+ and project_tokens_fraction_remaining is not None
169
+ and project_tokens_fraction_remaining < tokens_fraction_remaining
170
+ ):
171
+ best_tokens_info = project_tokens_info
172
+
173
+ if best_requests_info is None or best_tokens_info is None:
174
+ _logger.debug(f'get_header_info(): incomplete rate limit info: {headers}')
175
+
176
+ return best_requests_info, best_tokens_info
177
+
178
+
179
+ def _get_resource_info(headers: httpx.Headers, resource: str) -> tuple[int, int, datetime.datetime] | None:
180
+ remaining_str = headers.get(f'x-ratelimit-remaining-{resource}')
181
+ if remaining_str is None:
182
+ return None
183
+ remaining = int(remaining_str)
184
+ limit_str = headers.get(f'x-ratelimit-limit-{resource}')
185
+ limit = int(limit_str) if limit_str is not None else None
186
+ reset_str = headers.get(f'x-ratelimit-reset-{resource}')
187
+ reset_in_seconds = _parse_header_duration(reset_str) or 5.0 # Default to 5 seconds
188
+ reset_ts = datetime.datetime.now(tz=datetime.timezone.utc) + datetime.timedelta(seconds=reset_in_seconds)
189
+ return (limit, remaining, reset_ts)
190
+
191
+
192
+ def _fract_remaining(resource_info: tuple[int, int, datetime.datetime] | None) -> float | None:
193
+ if resource_info is None:
194
+ return None
195
+ limit, remaining, _ = resource_info
196
+ if limit is None or remaining is None:
197
+ return None
198
+ return remaining / limit
199
+
200
+
201
+ class OpenAIRateLimitsInfo(env.RateLimitsInfo):
202
+ retryable_errors: tuple[Type[Exception], ...]
203
+
204
+ def __init__(self, get_request_resources: Callable[..., dict[str, int]]):
205
+ super().__init__(get_request_resources)
206
+ import openai
207
+
208
+ self.retryable_errors = (
209
+ # ConnectionError: we occasionally see this error when the AsyncConnectionPool is trying to close
210
+ # expired connections
211
+ # (AsyncConnectionPool._close_expired_connections() fails with ConnectionError when executing
212
+ # 'await connection.aclose()', which is very likely a bug in AsyncConnectionPool)
213
+ openai.APIConnectionError,
214
+ # the following errors are retryable according to OpenAI's API documentation
215
+ openai.RateLimitError,
216
+ openai.APITimeoutError,
217
+ openai.UnprocessableEntityError,
218
+ openai.InternalServerError,
219
+ )
220
+
221
+ def record_exc(self, request_ts: datetime.datetime, exc: Exception) -> None:
222
+ import openai
223
+
224
+ _ = isinstance(exc, openai.APIError)
225
+ if not isinstance(exc, openai.APIError) or not hasattr(exc, 'response') or not hasattr(exc.response, 'headers'):
226
+ return
227
+
228
+ requests_info, tokens_info = _get_header_info(exc.response.headers)
229
+ _logger.debug(
230
+ f'record_exc(): request_ts: {request_ts}, requests_info={requests_info} tokens_info={tokens_info}'
231
+ )
232
+ self.record(request_ts=request_ts, requests=requests_info, tokens=tokens_info)
233
+ self.has_exc = True
234
+
235
+ def _retry_delay_from_exception(self, exc: Exception) -> float | None:
236
+ try:
237
+ retry_after_str = exc.response.headers.get('retry-after') # type: ignore
238
+ except AttributeError:
239
+ return None
240
+ if retry_after_str is not None and re.fullmatch(r'\d{1,4}', retry_after_str):
241
+ return float(retry_after_str)
242
+ return None
243
+
244
+ def get_retry_delay(self, exc: Exception, attempt: int) -> float | None:
245
+ import openai
246
+
247
+ if not isinstance(exc, self.retryable_errors):
248
+ return None
249
+ assert isinstance(exc, openai.APIError)
250
+ return self._retry_delay_from_exception(exc) or super().get_retry_delay(exc, attempt)
47
251
 
48
252
 
49
253
  #####################################
@@ -51,14 +255,16 @@ def _retry(fn: Callable) -> Callable:
51
255
 
52
256
 
53
257
  @pxt.udf
54
- def speech(
55
- input: str, *, model: str, voice: str, response_format: Optional[str] = None, speed: Optional[float] = None
56
- ) -> pxt.Audio:
258
+ async def speech(input: str, *, model: str, voice: str, model_kwargs: dict[str, Any] | None = None) -> pxt.Audio:
57
259
  """
58
260
  Generates audio from the input text.
59
261
 
60
262
  Equivalent to the OpenAI `audio/speech` API endpoint.
61
- For additional details, see: [https://platform.openai.com/docs/guides/text-to-speech](https://platform.openai.com/docs/guides/text-to-speech)
263
+ For additional details, see: <https://platform.openai.com/docs/guides/text-to-speech>
264
+
265
+ Request throttling:
266
+ Applies the rate limit set in the config (section `openai.rate_limits`; use the model id as the key). If no rate
267
+ limit is configured, uses a default of 600 RPM.
62
268
 
63
269
  __Requirements:__
64
270
 
@@ -69,8 +275,8 @@ def speech(
69
275
  model: The model to use for speech synthesis.
70
276
  voice: The voice profile to use for speech synthesis. Supported options include:
71
277
  `alloy`, `echo`, `fable`, `onyx`, `nova`, and `shimmer`.
72
-
73
- For details on the other parameters, see: [https://platform.openai.com/docs/api-reference/audio/createSpeech](https://platform.openai.com/docs/api-reference/audio/createSpeech)
278
+ model_kwargs: Additional keyword args for the OpenAI `audio/speech` API. For details on the available
279
+ parameters, see: <https://platform.openai.com/docs/api-reference/audio/createSpeech>
74
280
 
75
281
  Returns:
76
282
  An audio file containing the synthesized speech.
@@ -79,31 +285,29 @@ def speech(
79
285
  Add a computed column that applies the model `tts-1` to an existing Pixeltable column `tbl.text`
80
286
  of the table `tbl`:
81
287
 
82
- >>> tbl['audio'] = speech(tbl.text, model='tts-1', voice='nova')
288
+ >>> tbl.add_computed_column(audio=speech(tbl.text, model='tts-1', voice='nova'))
83
289
  """
84
- content = _retry(_openai_client().audio.speech.create)(
85
- input=input, model=model, voice=voice, response_format=_opt(response_format), speed=_opt(speed)
86
- )
87
- ext = response_format or 'mp3'
88
- output_filename = str(env.Env.get().tmp_dir / f'{uuid.uuid4()}.{ext}')
290
+ if model_kwargs is None:
291
+ model_kwargs = {}
292
+
293
+ content = await _openai_client().audio.speech.create(input=input, model=model, voice=voice, **model_kwargs)
294
+ ext = model_kwargs.get('response_format', 'mp3')
295
+ output_filename = str(TempStore.create_path(extension=f'.{ext}'))
89
296
  content.write_to_file(output_filename)
90
297
  return output_filename
91
298
 
92
299
 
93
300
  @pxt.udf
94
- def transcriptions(
95
- audio: pxt.Audio,
96
- *,
97
- model: str,
98
- language: Optional[str] = None,
99
- prompt: Optional[str] = None,
100
- temperature: Optional[float] = None,
101
- ) -> dict:
301
+ async def transcriptions(audio: pxt.Audio, *, model: str, model_kwargs: dict[str, Any] | None = None) -> dict:
102
302
  """
103
303
  Transcribes audio into the input language.
104
304
 
105
305
  Equivalent to the OpenAI `audio/transcriptions` API endpoint.
106
- For additional details, see: [https://platform.openai.com/docs/guides/speech-to-text](https://platform.openai.com/docs/guides/speech-to-text)
306
+ For additional details, see: <https://platform.openai.com/docs/guides/speech-to-text>
307
+
308
+ Request throttling:
309
+ Applies the rate limit set in the config (section `openai.rate_limits`; use the model id as the key). If no rate
310
+ limit is configured, uses a default of 600 RPM.
107
311
 
108
312
  __Requirements:__
109
313
 
@@ -112,8 +316,8 @@ def transcriptions(
112
316
  Args:
113
317
  audio: The audio to transcribe.
114
318
  model: The model to use for speech transcription.
115
-
116
- For details on the other parameters, see: [https://platform.openai.com/docs/api-reference/audio/createTranscription](https://platform.openai.com/docs/api-reference/audio/createTranscription)
319
+ model_kwargs: Additional keyword args for the OpenAI `audio/transcriptions` API. For details on the available
320
+ parameters, see: <https://platform.openai.com/docs/api-reference/audio/createTranscription>
117
321
 
118
322
  Returns:
119
323
  A dictionary containing the transcription and other metadata.
@@ -122,28 +326,27 @@ def transcriptions(
122
326
  Add a computed column that applies the model `whisper-1` to an existing Pixeltable column `tbl.audio`
123
327
  of the table `tbl`:
124
328
 
125
- >>> tbl['transcription'] = transcriptions(tbl.audio, model='whisper-1', language='en')
329
+ >>> tbl.add_computed_column(transcription=transcriptions(tbl.audio, model='whisper-1', language='en'))
126
330
  """
331
+ if model_kwargs is None:
332
+ model_kwargs = {}
333
+
127
334
  file = pathlib.Path(audio)
128
- transcription = _retry(_openai_client().audio.transcriptions.create)(
129
- file=file, model=model, language=_opt(language), prompt=_opt(prompt), temperature=_opt(temperature)
130
- )
335
+ transcription = await _openai_client().audio.transcriptions.create(file=file, model=model, **model_kwargs)
131
336
  return transcription.dict()
132
337
 
133
338
 
134
339
  @pxt.udf
135
- def translations(
136
- audio: pxt.Audio,
137
- *,
138
- model: str,
139
- prompt: Optional[str] = None,
140
- temperature: Optional[float] = None
141
- ) -> dict:
340
+ async def translations(audio: pxt.Audio, *, model: str, model_kwargs: dict[str, Any] | None = None) -> dict:
142
341
  """
143
342
  Translates audio into English.
144
343
 
145
344
  Equivalent to the OpenAI `audio/translations` API endpoint.
146
- For additional details, see: [https://platform.openai.com/docs/guides/speech-to-text](https://platform.openai.com/docs/guides/speech-to-text)
345
+ For additional details, see: <https://platform.openai.com/docs/guides/speech-to-text>
346
+
347
+ Request throttling:
348
+ Applies the rate limit set in the config (section `openai.rate_limits`; use the model id as the key). If no rate
349
+ limit is configured, uses a default of 600 RPM.
147
350
 
148
351
  __Requirements:__
149
352
 
@@ -152,8 +355,8 @@ def translations(
152
355
  Args:
153
356
  audio: The audio to translate.
154
357
  model: The model to use for speech transcription and translation.
155
-
156
- For details on the other parameters, see: [https://platform.openai.com/docs/api-reference/audio/createTranslation](https://platform.openai.com/docs/api-reference/audio/createTranslation)
358
+ model_kwargs: Additional keyword args for the OpenAI `audio/translations` API. For details on the available
359
+ parameters, see: <https://platform.openai.com/docs/api-reference/audio/createTranslation>
157
360
 
158
361
  Returns:
159
362
  A dictionary containing the translation and other metadata.
@@ -162,12 +365,13 @@ def translations(
162
365
  Add a computed column that applies the model `whisper-1` to an existing Pixeltable column `tbl.audio`
163
366
  of the table `tbl`:
164
367
 
165
- >>> tbl['translation'] = translations(tbl.audio, model='whisper-1', language='en')
368
+ >>> tbl.add_computed_column(translation=translations(tbl.audio, model='whisper-1', language='en'))
166
369
  """
370
+ if model_kwargs is None:
371
+ model_kwargs = {}
372
+
167
373
  file = pathlib.Path(audio)
168
- translation = _retry(_openai_client().audio.translations.create)(
169
- file=file, model=model, prompt=_opt(prompt), temperature=_opt(temperature)
170
- )
374
+ translation = await _openai_client().audio.translations.create(file=file, model=model, **model_kwargs)
171
375
  return translation.dict()
172
376
 
173
377
 
@@ -175,32 +379,75 @@ def translations(
175
379
  # Chat Endpoints
176
380
 
177
381
 
382
+ def _default_max_tokens(model: str) -> int:
383
+ if (
384
+ _is_model_family(model, 'gpt-4o-realtime')
385
+ or _is_model_family(model, 'gpt-4o-mini-realtime')
386
+ or _is_model_family(model, 'gpt-4-turbo')
387
+ or _is_model_family(model, 'gpt-3.5-turbo')
388
+ ):
389
+ return 4096
390
+ if _is_model_family(model, 'gpt-4'):
391
+ return 8192 # All other gpt-4 models (will not match on gpt-4o models)
392
+ if _is_model_family(model, 'gpt-4o') or _is_model_family(model, 'gpt-4.5-preview'):
393
+ return 16384 # All other gpt-4o / gpt-4.5 models
394
+ if _is_model_family(model, 'o1-preview'):
395
+ return 32768
396
+ if _is_model_family(model, 'o1-mini'):
397
+ return 65536
398
+ if _is_model_family(model, 'o1') or _is_model_family(model, 'o3'):
399
+ return 100000 # All other o1 / o3 models
400
+ return 100000 # global default
401
+
402
+
403
+ def _is_model_family(model: str, family: str) -> bool:
404
+ # `model.startswith(family)` would be a simpler match, but increases the risk of false positives.
405
+ # We use a slightly more complicated criterion to make things a little less error prone.
406
+ return model == family or model.startswith(f'{family}-')
407
+
408
+
409
+ def _chat_completions_get_request_resources(
410
+ messages: list, model: str, model_kwargs: dict[str, Any] | None
411
+ ) -> dict[str, int]:
412
+ if model_kwargs is None:
413
+ model_kwargs = {}
414
+
415
+ max_completion_tokens = model_kwargs.get('max_completion_tokens')
416
+ max_tokens = model_kwargs.get('max_tokens')
417
+ n = model_kwargs.get('n')
418
+
419
+ completion_tokens = (n or 1) * (max_completion_tokens or max_tokens or _default_max_tokens(model))
420
+
421
+ num_tokens = 0.0
422
+ for message in messages:
423
+ num_tokens += 4 # every message follows <im_start>{role/name}\n{content}<im_end>\n
424
+ for key, value in message.items():
425
+ num_tokens += len(value) / 4
426
+ if key == 'name': # if there's a name, the role is omitted
427
+ num_tokens -= 1 # role is always required and always 1 token
428
+ num_tokens += 2 # every reply is primed with <im_start>assistant
429
+ return {'requests': 1, 'tokens': int(num_tokens) + completion_tokens}
430
+
431
+
178
432
  @pxt.udf
179
- def chat_completions(
433
+ async def chat_completions(
180
434
  messages: list,
181
435
  *,
182
436
  model: str,
183
- frequency_penalty: Optional[float] = None,
184
- logit_bias: Optional[dict[str, int]] = None,
185
- logprobs: Optional[bool] = None,
186
- top_logprobs: Optional[int] = None,
187
- max_tokens: Optional[int] = None,
188
- n: Optional[int] = None,
189
- presence_penalty: Optional[float] = None,
190
- response_format: Optional[dict] = None,
191
- seed: Optional[int] = None,
192
- stop: Optional[list[str]] = None,
193
- temperature: Optional[float] = None,
194
- top_p: Optional[float] = None,
195
- tools: Optional[list[dict]] = None,
196
- tool_choice: Optional[dict] = None,
197
- user: Optional[str] = None,
437
+ model_kwargs: dict[str, Any] | None = None,
438
+ tools: list[dict[str, Any]] | None = None,
439
+ tool_choice: dict[str, Any] | None = None,
440
+ _runtime_ctx: env.RuntimeCtx | None = None,
198
441
  ) -> dict:
199
442
  """
200
443
  Creates a model response for the given chat conversation.
201
444
 
202
445
  Equivalent to the OpenAI `chat/completions` API endpoint.
203
- For additional details, see: [https://platform.openai.com/docs/guides/chat-completions](https://platform.openai.com/docs/guides/chat-completions)
446
+ For additional details, see: <https://platform.openai.com/docs/guides/chat-completions>
447
+
448
+ Request throttling:
449
+ Uses the rate limit-related headers returned by the API to throttle requests adaptively, based on available
450
+ request and token capacity. No configuration is necessary.
204
451
 
205
452
  __Requirements:__
206
453
 
@@ -209,8 +456,8 @@ def chat_completions(
209
456
  Args:
210
457
  messages: A list of messages to use for chat completion, as described in the OpenAI API documentation.
211
458
  model: The model to use for chat completion.
212
-
213
- For details on the other parameters, see: [https://platform.openai.com/docs/api-reference/chat](https://platform.openai.com/docs/api-reference/chat)
459
+ model_kwargs: Additional keyword args for the OpenAI `chat/completions` API. For details on the available
460
+ parameters, see: <https://platform.openai.com/docs/api-reference/chat/create>
214
461
 
215
462
  Returns:
216
463
  A dictionary containing the response and other metadata.
@@ -220,40 +467,101 @@ def chat_completions(
220
467
  of the table `tbl`:
221
468
 
222
469
  >>> messages = [
223
- {'role': 'system', 'content': 'You are a helpful assistant.'},
224
- {'role': 'user', 'content': tbl.prompt}
225
- ]
226
- tbl['response'] = chat_completions(messages, model='gpt-4o-mini')
470
+ ... {'role': 'system', 'content': 'You are a helpful assistant.'},
471
+ ... {'role': 'user', 'content': tbl.prompt}
472
+ ... ]
473
+ >>> tbl.add_computed_column(response=chat_completions(messages, model='gpt-4o-mini'))
227
474
  """
228
- result = _retry(_openai_client().chat.completions.create)(
229
- messages=messages,
230
- model=model,
231
- frequency_penalty=_opt(frequency_penalty),
232
- logit_bias=_opt(logit_bias),
233
- logprobs=_opt(logprobs),
234
- top_logprobs=_opt(top_logprobs),
235
- max_tokens=_opt(max_tokens),
236
- n=_opt(n),
237
- presence_penalty=_opt(presence_penalty),
238
- response_format=_opt(response_format),
239
- seed=_opt(seed),
240
- stop=_opt(stop),
241
- temperature=_opt(temperature),
242
- top_p=_opt(top_p),
243
- tools=_opt(tools),
244
- tool_choice=_opt(tool_choice),
245
- user=_opt(user),
475
+ if model_kwargs is None:
476
+ model_kwargs = {}
477
+
478
+ if tools is not None:
479
+ model_kwargs['tools'] = [{'type': 'function', 'function': tool} for tool in tools]
480
+
481
+ if tool_choice is not None:
482
+ if tool_choice['auto']:
483
+ model_kwargs['tool_choice'] = 'auto'
484
+ elif tool_choice['required']:
485
+ model_kwargs['tool_choice'] = 'required'
486
+ else:
487
+ assert tool_choice['tool'] is not None
488
+ model_kwargs['tool_choice'] = {'type': 'function', 'function': {'name': tool_choice['tool']}}
489
+
490
+ if tool_choice is not None and not tool_choice['parallel_tool_calls']:
491
+ model_kwargs['parallel_tool_calls'] = False
492
+
493
+ # make sure the pool info exists prior to making the request
494
+ resource_pool = _rate_limits_pool(model)
495
+ rate_limits_info = env.Env.get().get_resource_pool_info(
496
+ resource_pool, lambda: OpenAIRateLimitsInfo(_chat_completions_get_request_resources)
246
497
  )
247
- return result.dict()
498
+
499
+ request_ts = datetime.datetime.now(tz=datetime.timezone.utc)
500
+ result = await _openai_client().chat.completions.with_raw_response.create(
501
+ messages=messages, model=model, **model_kwargs
502
+ )
503
+
504
+ requests_info, tokens_info = _get_header_info(result.headers)
505
+ is_retry = _runtime_ctx is not None and _runtime_ctx.is_retry
506
+ rate_limits_info.record(request_ts=request_ts, requests=requests_info, tokens=tokens_info, reset_exc=is_retry)
507
+
508
+ return json.loads(result.text)
509
+
510
+
511
+ def _vision_get_request_resources(
512
+ prompt: str, image: PIL.Image.Image, model: str, model_kwargs: dict[str, Any] | None = None
513
+ ) -> dict[str, int]:
514
+ if model_kwargs is None:
515
+ model_kwargs = {}
516
+
517
+ max_completion_tokens = model_kwargs.get('max_completion_tokens')
518
+ max_tokens = model_kwargs.get('max_tokens')
519
+ n = model_kwargs.get('n')
520
+
521
+ completion_tokens = (n or 1) * (max_completion_tokens or max_tokens or _default_max_tokens(model))
522
+ prompt_tokens = len(prompt) / 4
523
+
524
+ # calculate image tokens based on
525
+ # https://platform.openai.com/docs/guides/vision/calculating-costs#calculating-costs
526
+ # assuming detail='high' (which appears to be the default, according to community forum posts)
527
+
528
+ # number of 512x512 crops; ceil(): partial crops still count as full crops
529
+ crops_width = math.ceil(image.width / 512)
530
+ crops_height = math.ceil(image.height / 512)
531
+ total_crops = crops_width * crops_height
532
+
533
+ base_tokens = 85 # base cost for the initial 512x512 overview
534
+ crop_tokens = 170 # cost per additional 512x512 crop
535
+ img_tokens = base_tokens + (crop_tokens * total_crops)
536
+
537
+ total_tokens = (
538
+ prompt_tokens
539
+ + img_tokens
540
+ + completion_tokens
541
+ + 4 # for <im_start>{role/name}\n{content}<im_end>\n
542
+ + 2 # for reply's <im_start>assistant
543
+ )
544
+ return {'requests': 1, 'tokens': int(total_tokens)}
248
545
 
249
546
 
250
547
  @pxt.udf
251
- def vision(prompt: str, image: PIL.Image.Image, *, model: str) -> str:
548
+ async def vision(
549
+ prompt: str,
550
+ image: PIL.Image.Image,
551
+ *,
552
+ model: str,
553
+ model_kwargs: dict[str, Any] | None = None,
554
+ _runtime_ctx: env.RuntimeCtx | None = None,
555
+ ) -> str:
252
556
  """
253
557
  Analyzes an image with the OpenAI vision capability. This is a convenience function that takes an image and
254
558
  prompt, and constructs a chat completion request that utilizes OpenAI vision.
255
559
 
256
- For additional details, see: [https://platform.openai.com/docs/guides/vision](https://platform.openai.com/docs/guides/vision)
560
+ For additional details, see: <https://platform.openai.com/docs/guides/vision>
561
+
562
+ Request throttling:
563
+ Uses the rate limit-related headers returned by the API to throttle requests adaptively, based on available
564
+ request and token capacity. No configuration is necessary.
257
565
 
258
566
  __Requirements:__
259
567
 
@@ -271,8 +579,11 @@ def vision(prompt: str, image: PIL.Image.Image, *, model: str) -> str:
271
579
  Add a computed column that applies the model `gpt-4o-mini` to an existing Pixeltable column `tbl.image`
272
580
  of the table `tbl`:
273
581
 
274
- >>> tbl['response'] = vision("What's in this image?", tbl.image, model='gpt-4o-mini')
582
+ >>> tbl.add_computed_column(response=vision("What's in this image?", tbl.image, model='gpt-4o-mini'))
275
583
  """
584
+ if model_kwargs is None:
585
+ model_kwargs = {}
586
+
276
587
  # TODO(aaron-siegel): Decompose CPU/GPU ops into separate functions
277
588
  bytes_arr = io.BytesIO()
278
589
  image.save(bytes_arr, format='png')
@@ -287,8 +598,27 @@ def vision(prompt: str, image: PIL.Image.Image, *, model: str) -> str:
287
598
  ],
288
599
  }
289
600
  ]
290
- result = _retry(_openai_client().chat.completions.create)(messages=messages, model=model)
291
- return result.choices[0].message.content
601
+
602
+ # make sure the pool info exists prior to making the request
603
+ resource_pool = _rate_limits_pool(model)
604
+ rate_limits_info = env.Env.get().get_resource_pool_info(
605
+ resource_pool, lambda: OpenAIRateLimitsInfo(_vision_get_request_resources)
606
+ )
607
+
608
+ request_ts = datetime.datetime.now(tz=datetime.timezone.utc)
609
+ result = await _openai_client().chat.completions.with_raw_response.create(
610
+ messages=messages, # type: ignore
611
+ model=model,
612
+ **model_kwargs,
613
+ )
614
+
615
+ # _logger.debug(f'vision(): headers={result.headers}')
616
+ requests_info, tokens_info = _get_header_info(result.headers)
617
+ is_retry = _runtime_ctx is not None and _runtime_ctx.is_retry
618
+ rate_limits_info.record(request_ts=request_ts, requests=requests_info, tokens=tokens_info, reset_exc=is_retry)
619
+
620
+ result = json.loads(result.text)
621
+ return result['choices'][0]['message']['content']
292
622
 
293
623
 
294
624
  #####################################
@@ -301,15 +631,28 @@ _embedding_dimensions_cache: dict[str, int] = {
301
631
  }
302
632
 
303
633
 
634
+ def _embeddings_get_request_resources(input: list[str]) -> dict[str, int]:
635
+ input_len = sum(len(s) for s in input)
636
+ return {'requests': 1, 'tokens': int(input_len / 4)}
637
+
638
+
304
639
  @pxt.udf(batch_size=32)
305
- def embeddings(
306
- input: Batch[str], *, model: str, dimensions: Optional[int] = None, user: Optional[str] = None
640
+ async def embeddings(
641
+ input: Batch[str],
642
+ *,
643
+ model: str,
644
+ model_kwargs: dict[str, Any] | None = None,
645
+ _runtime_ctx: env.RuntimeCtx | None = None,
307
646
  ) -> Batch[pxt.Array[(None,), pxt.Float]]:
308
647
  """
309
648
  Creates an embedding vector representing the input text.
310
649
 
311
650
  Equivalent to the OpenAI `embeddings` API endpoint.
312
- For additional details, see: [https://platform.openai.com/docs/guides/embeddings](https://platform.openai.com/docs/guides/embeddings)
651
+ For additional details, see: <https://platform.openai.com/docs/guides/embeddings>
652
+
653
+ Request throttling:
654
+ Uses the rate limit-related headers returned by the API to throttle requests adaptively, based on available
655
+ request and token capacity. No configuration is necessary.
313
656
 
314
657
  __Requirements:__
315
658
 
@@ -318,10 +661,8 @@ def embeddings(
318
661
  Args:
319
662
  input: The text to embed.
320
663
  model: The model to use for the embedding.
321
- dimensions: The vector length of the embedding. If not specified, Pixeltable will use
322
- a default value based on the model.
323
-
324
- For details on the other parameters, see: [https://platform.openai.com/docs/api-reference/embeddings](https://platform.openai.com/docs/api-reference/embeddings)
664
+ model_kwargs: Additional keyword args for the OpenAI `embeddings` API. For details on the available
665
+ parameters, see: <https://platform.openai.com/docs/api-reference/embeddings>
325
666
 
326
667
  Returns:
327
668
  An array representing the application of the given embedding to `input`.
@@ -330,22 +671,41 @@ def embeddings(
330
671
  Add a computed column that applies the model `text-embedding-3-small` to an existing
331
672
  Pixeltable column `tbl.text` of the table `tbl`:
332
673
 
333
- >>> tbl['embed'] = embeddings(tbl.text, model='text-embedding-3-small')
674
+ >>> tbl.add_computed_column(embed=embeddings(tbl.text, model='text-embedding-3-small'))
675
+
676
+ Add an embedding index to an existing column `text`, using the model `text-embedding-3-small`:
677
+
678
+ >>> tbl.add_embedding_index(embedding=embeddings.using(model='text-embedding-3-small'))
334
679
  """
335
- result = _retry(_openai_client().embeddings.create)(
336
- input=input, model=model, dimensions=_opt(dimensions), user=_opt(user), encoding_format='float'
680
+ if model_kwargs is None:
681
+ model_kwargs = {}
682
+
683
+ _logger.debug(f'embeddings: batch_size={len(input)}')
684
+ resource_pool = _rate_limits_pool(model)
685
+ rate_limits_info = env.Env.get().get_resource_pool_info(
686
+ resource_pool, lambda: OpenAIRateLimitsInfo(_embeddings_get_request_resources)
687
+ )
688
+ request_ts = datetime.datetime.now(tz=datetime.timezone.utc)
689
+ result = await _openai_client().embeddings.with_raw_response.create(
690
+ input=input, model=model, encoding_format='float', **model_kwargs
337
691
  )
338
- return [np.array(data.embedding, dtype=np.float64) for data in result.data]
692
+ requests_info, tokens_info = _get_header_info(result.headers)
693
+ is_retry = _runtime_ctx is not None and _runtime_ctx.is_retry
694
+ rate_limits_info.record(request_ts=request_ts, requests=requests_info, tokens=tokens_info, reset_exc=is_retry)
695
+ return [np.array(data['embedding'], dtype=np.float64) for data in json.loads(result.content)['data']]
339
696
 
340
697
 
341
698
  @embeddings.conditional_return_type
342
- def _(model: str, dimensions: Optional[int] = None) -> pxt.ArrayType:
699
+ def _(model: str, model_kwargs: dict[str, Any] | None = None) -> ts.ArrayType:
700
+ dimensions: int | None = None
701
+ if model_kwargs is not None:
702
+ dimensions = model_kwargs.get('dimensions')
343
703
  if dimensions is None:
344
704
  if model not in _embedding_dimensions_cache:
345
705
  # TODO: find some other way to retrieve a sample
346
- return pxt.ArrayType((None,), dtype=pxt.FloatType(), nullable=False)
347
- dimensions = _embedding_dimensions_cache.get(model, None)
348
- return pxt.ArrayType((dimensions,), dtype=pxt.FloatType(), nullable=False)
706
+ return ts.ArrayType((None,), dtype=ts.FloatType(), nullable=False)
707
+ dimensions = _embedding_dimensions_cache.get(model)
708
+ return ts.ArrayType((dimensions,), dtype=ts.FloatType(), nullable=False)
349
709
 
350
710
 
351
711
  #####################################
@@ -353,20 +713,18 @@ def _(model: str, dimensions: Optional[int] = None) -> pxt.ArrayType:
353
713
 
354
714
 
355
715
  @pxt.udf
356
- def image_generations(
357
- prompt: str,
358
- *,
359
- model: Optional[str] = None,
360
- quality: Optional[str] = None,
361
- size: Optional[str] = None,
362
- style: Optional[str] = None,
363
- user: Optional[str] = None,
716
+ async def image_generations(
717
+ prompt: str, *, model: str = 'dall-e-2', model_kwargs: dict[str, Any] | None = None
364
718
  ) -> PIL.Image.Image:
365
719
  """
366
720
  Creates an image given a prompt.
367
721
 
368
722
  Equivalent to the OpenAI `images/generations` API endpoint.
369
- For additional details, see: [https://platform.openai.com/docs/guides/images](https://platform.openai.com/docs/guides/images)
723
+ For additional details, see: <https://platform.openai.com/docs/guides/images>
724
+
725
+ Request throttling:
726
+ Applies the rate limit set in the config (section `openai.rate_limits`; use the model id as the key). If no rate
727
+ limit is configured, uses a default of 600 RPM.
370
728
 
371
729
  __Requirements:__
372
730
 
@@ -375,8 +733,8 @@ def image_generations(
375
733
  Args:
376
734
  prompt: Prompt for the image.
377
735
  model: The model to use for the generations.
378
-
379
- For details on the other parameters, see: [https://platform.openai.com/docs/api-reference/images/create](https://platform.openai.com/docs/api-reference/images/create)
736
+ model_kwargs: Additional keyword args for the OpenAI `images/generations` API. For details on the available
737
+ parameters, see: <https://platform.openai.com/docs/api-reference/images/create>
380
738
 
381
739
  Returns:
382
740
  The generated image.
@@ -385,17 +743,14 @@ def image_generations(
385
743
  Add a computed column that applies the model `dall-e-2` to an existing
386
744
  Pixeltable column `tbl.text` of the table `tbl`:
387
745
 
388
- >>> tbl['gen_image'] = image_generations(tbl.text, model='dall-e-2')
746
+ >>> tbl.add_computed_column(gen_image=image_generations(tbl.text, model='dall-e-2'))
389
747
  """
748
+ if model_kwargs is None:
749
+ model_kwargs = {}
750
+
390
751
  # TODO(aaron-siegel): Decompose CPU/GPU ops into separate functions
391
- result = _retry(_openai_client().images.generate)(
392
- prompt=prompt,
393
- model=_opt(model),
394
- quality=_opt(quality),
395
- size=_opt(size),
396
- style=_opt(style),
397
- user=_opt(user),
398
- response_format='b64_json',
752
+ result = await _openai_client().images.generate(
753
+ prompt=prompt, model=model, response_format='b64_json', **model_kwargs
399
754
  )
400
755
  b64_str = result.data[0].b64_json
401
756
  b64_bytes = base64.b64decode(b64_str)
@@ -405,17 +760,19 @@ def image_generations(
405
760
 
406
761
 
407
762
  @image_generations.conditional_return_type
408
- def _(size: Optional[str] = None) -> pxt.ImageType:
409
- if size is None:
410
- return pxt.ImageType(size=(1024, 1024))
763
+ def _(model_kwargs: dict[str, Any] | None = None) -> ts.ImageType:
764
+ if model_kwargs is None or 'size' not in model_kwargs:
765
+ # default size is 1024x1024
766
+ return ts.ImageType(size=(1024, 1024))
767
+ size = model_kwargs['size']
411
768
  x_pos = size.find('x')
412
769
  if x_pos == -1:
413
- return pxt.ImageType()
770
+ return ts.ImageType()
414
771
  try:
415
772
  width, height = int(size[:x_pos]), int(size[x_pos + 1 :])
416
773
  except ValueError:
417
- return pxt.ImageType()
418
- return pxt.ImageType(size=(width, height))
774
+ return ts.ImageType()
775
+ return ts.ImageType(size=(width, height))
419
776
 
420
777
 
421
778
  #####################################
@@ -423,12 +780,16 @@ def _(size: Optional[str] = None) -> pxt.ImageType:
423
780
 
424
781
 
425
782
  @pxt.udf
426
- def moderations(input: str, *, model: Optional[str] = None) -> dict:
783
+ async def moderations(input: str, *, model: str = 'omni-moderation-latest') -> dict:
427
784
  """
428
785
  Classifies if text is potentially harmful.
429
786
 
430
787
  Equivalent to the OpenAI `moderations` API endpoint.
431
- For additional details, see: [https://platform.openai.com/docs/guides/moderation](https://platform.openai.com/docs/guides/moderation)
788
+ For additional details, see: <https://platform.openai.com/docs/guides/moderation>
789
+
790
+ Request throttling:
791
+ Applies the rate limit set in the config (section `openai.rate_limits`; use the model id as the key). If no rate
792
+ limit is configured, uses a default of 600 RPM.
432
793
 
433
794
  __Requirements:__
434
795
 
@@ -438,7 +799,7 @@ def moderations(input: str, *, model: Optional[str] = None) -> dict:
438
799
  input: Text to analyze with the moderations model.
439
800
  model: The model to use for moderations.
440
801
 
441
- For details on the other parameters, see: [https://platform.openai.com/docs/api-reference/moderations](https://platform.openai.com/docs/api-reference/moderations)
802
+ For details on the other parameters, see: <https://platform.openai.com/docs/api-reference/moderations>
442
803
 
443
804
  Returns:
444
805
  Details of the moderations results.
@@ -447,22 +808,49 @@ def moderations(input: str, *, model: Optional[str] = None) -> dict:
447
808
  Add a computed column that applies the model `text-moderation-stable` to an existing
448
809
  Pixeltable column `tbl.input` of the table `tbl`:
449
810
 
450
- >>> tbl['moderations'] = moderations(tbl.text, model='text-moderation-stable')
811
+ >>> tbl.add_computed_column(moderations=moderations(tbl.text, model='text-moderation-stable'))
451
812
  """
452
- result = _retry(_openai_client().moderations.create)(input=input, model=_opt(model))
813
+ result = await _openai_client().moderations.create(input=input, model=model)
453
814
  return result.dict()
454
815
 
455
816
 
456
- _T = TypeVar('_T')
817
+ @speech.resource_pool
818
+ @transcriptions.resource_pool
819
+ @translations.resource_pool
820
+ @image_generations.resource_pool
821
+ @moderations.resource_pool
822
+ def _(model: str) -> str:
823
+ return f'request-rate:openai:{model}'
457
824
 
458
825
 
459
- def _opt(arg: _T) -> Union[_T, 'openai.NotGiven']:
460
- import openai
461
- return arg if arg is not None else openai.NOT_GIVEN
826
+ @chat_completions.resource_pool
827
+ @vision.resource_pool
828
+ @embeddings.resource_pool
829
+ def _(model: str) -> str:
830
+ return _rate_limits_pool(model)
831
+
832
+
833
+ def invoke_tools(tools: Tools, response: exprs.Expr) -> exprs.InlineDict:
834
+ """Converts an OpenAI response dict to Pixeltable tool invocation format and calls `tools._invoke()`."""
835
+ return tools._invoke(_openai_response_to_pxt_tool_calls(response))
836
+
837
+
838
+ @pxt.udf
839
+ def _openai_response_to_pxt_tool_calls(response: dict) -> dict | None:
840
+ if 'tool_calls' not in response['choices'][0]['message'] or response['choices'][0]['message']['tool_calls'] is None:
841
+ return None
842
+ openai_tool_calls = response['choices'][0]['message']['tool_calls']
843
+ pxt_tool_calls: dict[str, list[dict[str, Any]]] = {}
844
+ for tool_call in openai_tool_calls:
845
+ tool_name = tool_call['function']['name']
846
+ if tool_name not in pxt_tool_calls:
847
+ pxt_tool_calls[tool_name] = []
848
+ pxt_tool_calls[tool_name].append({'args': json.loads(tool_call['function']['arguments'])})
849
+ return pxt_tool_calls
462
850
 
463
851
 
464
852
  __all__ = local_public_names(__name__)
465
853
 
466
854
 
467
- def __dir__():
855
+ def __dir__() -> list[str]:
468
856
  return __all__