pixeltable 0.2.26__py3-none-any.whl → 0.5.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (245)
  1. pixeltable/__init__.py +83 -19
  2. pixeltable/_query.py +1444 -0
  3. pixeltable/_version.py +1 -0
  4. pixeltable/catalog/__init__.py +7 -4
  5. pixeltable/catalog/catalog.py +2394 -119
  6. pixeltable/catalog/column.py +225 -104
  7. pixeltable/catalog/dir.py +38 -9
  8. pixeltable/catalog/globals.py +53 -34
  9. pixeltable/catalog/insertable_table.py +265 -115
  10. pixeltable/catalog/path.py +80 -17
  11. pixeltable/catalog/schema_object.py +28 -43
  12. pixeltable/catalog/table.py +1270 -677
  13. pixeltable/catalog/table_metadata.py +103 -0
  14. pixeltable/catalog/table_version.py +1270 -751
  15. pixeltable/catalog/table_version_handle.py +109 -0
  16. pixeltable/catalog/table_version_path.py +137 -42
  17. pixeltable/catalog/tbl_ops.py +53 -0
  18. pixeltable/catalog/update_status.py +191 -0
  19. pixeltable/catalog/view.py +251 -134
  20. pixeltable/config.py +215 -0
  21. pixeltable/env.py +736 -285
  22. pixeltable/exceptions.py +26 -2
  23. pixeltable/exec/__init__.py +7 -2
  24. pixeltable/exec/aggregation_node.py +39 -21
  25. pixeltable/exec/cache_prefetch_node.py +87 -109
  26. pixeltable/exec/cell_materialization_node.py +268 -0
  27. pixeltable/exec/cell_reconstruction_node.py +168 -0
  28. pixeltable/exec/component_iteration_node.py +25 -28
  29. pixeltable/exec/data_row_batch.py +11 -46
  30. pixeltable/exec/exec_context.py +26 -11
  31. pixeltable/exec/exec_node.py +35 -27
  32. pixeltable/exec/expr_eval/__init__.py +3 -0
  33. pixeltable/exec/expr_eval/evaluators.py +365 -0
  34. pixeltable/exec/expr_eval/expr_eval_node.py +413 -0
  35. pixeltable/exec/expr_eval/globals.py +200 -0
  36. pixeltable/exec/expr_eval/row_buffer.py +74 -0
  37. pixeltable/exec/expr_eval/schedulers.py +413 -0
  38. pixeltable/exec/globals.py +35 -0
  39. pixeltable/exec/in_memory_data_node.py +35 -27
  40. pixeltable/exec/object_store_save_node.py +293 -0
  41. pixeltable/exec/row_update_node.py +44 -29
  42. pixeltable/exec/sql_node.py +414 -115
  43. pixeltable/exprs/__init__.py +8 -5
  44. pixeltable/exprs/arithmetic_expr.py +79 -45
  45. pixeltable/exprs/array_slice.py +5 -5
  46. pixeltable/exprs/column_property_ref.py +40 -26
  47. pixeltable/exprs/column_ref.py +254 -61
  48. pixeltable/exprs/comparison.py +14 -9
  49. pixeltable/exprs/compound_predicate.py +9 -10
  50. pixeltable/exprs/data_row.py +213 -72
  51. pixeltable/exprs/expr.py +270 -104
  52. pixeltable/exprs/expr_dict.py +6 -5
  53. pixeltable/exprs/expr_set.py +20 -11
  54. pixeltable/exprs/function_call.py +383 -284
  55. pixeltable/exprs/globals.py +18 -5
  56. pixeltable/exprs/in_predicate.py +7 -7
  57. pixeltable/exprs/inline_expr.py +37 -37
  58. pixeltable/exprs/is_null.py +8 -4
  59. pixeltable/exprs/json_mapper.py +120 -54
  60. pixeltable/exprs/json_path.py +90 -60
  61. pixeltable/exprs/literal.py +61 -16
  62. pixeltable/exprs/method_ref.py +7 -6
  63. pixeltable/exprs/object_ref.py +19 -8
  64. pixeltable/exprs/row_builder.py +238 -75
  65. pixeltable/exprs/rowid_ref.py +53 -15
  66. pixeltable/exprs/similarity_expr.py +65 -50
  67. pixeltable/exprs/sql_element_cache.py +5 -5
  68. pixeltable/exprs/string_op.py +107 -0
  69. pixeltable/exprs/type_cast.py +25 -13
  70. pixeltable/exprs/variable.py +2 -2
  71. pixeltable/func/__init__.py +9 -5
  72. pixeltable/func/aggregate_function.py +197 -92
  73. pixeltable/func/callable_function.py +119 -35
  74. pixeltable/func/expr_template_function.py +101 -48
  75. pixeltable/func/function.py +375 -62
  76. pixeltable/func/function_registry.py +20 -19
  77. pixeltable/func/globals.py +6 -5
  78. pixeltable/func/mcp.py +74 -0
  79. pixeltable/func/query_template_function.py +151 -35
  80. pixeltable/func/signature.py +178 -49
  81. pixeltable/func/tools.py +164 -0
  82. pixeltable/func/udf.py +176 -53
  83. pixeltable/functions/__init__.py +44 -4
  84. pixeltable/functions/anthropic.py +226 -47
  85. pixeltable/functions/audio.py +148 -11
  86. pixeltable/functions/bedrock.py +137 -0
  87. pixeltable/functions/date.py +188 -0
  88. pixeltable/functions/deepseek.py +113 -0
  89. pixeltable/functions/document.py +81 -0
  90. pixeltable/functions/fal.py +76 -0
  91. pixeltable/functions/fireworks.py +72 -20
  92. pixeltable/functions/gemini.py +249 -0
  93. pixeltable/functions/globals.py +208 -53
  94. pixeltable/functions/groq.py +108 -0
  95. pixeltable/functions/huggingface.py +1088 -95
  96. pixeltable/functions/image.py +155 -84
  97. pixeltable/functions/json.py +8 -11
  98. pixeltable/functions/llama_cpp.py +31 -19
  99. pixeltable/functions/math.py +169 -0
  100. pixeltable/functions/mistralai.py +50 -75
  101. pixeltable/functions/net.py +70 -0
  102. pixeltable/functions/ollama.py +29 -36
  103. pixeltable/functions/openai.py +548 -160
  104. pixeltable/functions/openrouter.py +143 -0
  105. pixeltable/functions/replicate.py +15 -14
  106. pixeltable/functions/reve.py +250 -0
  107. pixeltable/functions/string.py +310 -85
  108. pixeltable/functions/timestamp.py +37 -19
  109. pixeltable/functions/together.py +77 -120
  110. pixeltable/functions/twelvelabs.py +188 -0
  111. pixeltable/functions/util.py +7 -2
  112. pixeltable/functions/uuid.py +30 -0
  113. pixeltable/functions/video.py +1528 -117
  114. pixeltable/functions/vision.py +26 -26
  115. pixeltable/functions/voyageai.py +289 -0
  116. pixeltable/functions/whisper.py +19 -10
  117. pixeltable/functions/whisperx.py +179 -0
  118. pixeltable/functions/yolox.py +112 -0
  119. pixeltable/globals.py +716 -236
  120. pixeltable/index/__init__.py +3 -1
  121. pixeltable/index/base.py +17 -21
  122. pixeltable/index/btree.py +32 -22
  123. pixeltable/index/embedding_index.py +155 -92
  124. pixeltable/io/__init__.py +12 -7
  125. pixeltable/io/datarows.py +140 -0
  126. pixeltable/io/external_store.py +83 -125
  127. pixeltable/io/fiftyone.py +24 -33
  128. pixeltable/io/globals.py +47 -182
  129. pixeltable/io/hf_datasets.py +96 -127
  130. pixeltable/io/label_studio.py +171 -156
  131. pixeltable/io/lancedb.py +3 -0
  132. pixeltable/io/pandas.py +136 -115
  133. pixeltable/io/parquet.py +40 -153
  134. pixeltable/io/table_data_conduit.py +702 -0
  135. pixeltable/io/utils.py +100 -0
  136. pixeltable/iterators/__init__.py +8 -4
  137. pixeltable/iterators/audio.py +207 -0
  138. pixeltable/iterators/base.py +9 -3
  139. pixeltable/iterators/document.py +144 -87
  140. pixeltable/iterators/image.py +17 -38
  141. pixeltable/iterators/string.py +15 -12
  142. pixeltable/iterators/video.py +523 -127
  143. pixeltable/metadata/__init__.py +33 -8
  144. pixeltable/metadata/converters/convert_10.py +2 -3
  145. pixeltable/metadata/converters/convert_13.py +2 -2
  146. pixeltable/metadata/converters/convert_15.py +15 -11
  147. pixeltable/metadata/converters/convert_16.py +4 -5
  148. pixeltable/metadata/converters/convert_17.py +4 -5
  149. pixeltable/metadata/converters/convert_18.py +4 -6
  150. pixeltable/metadata/converters/convert_19.py +6 -9
  151. pixeltable/metadata/converters/convert_20.py +3 -6
  152. pixeltable/metadata/converters/convert_21.py +6 -8
  153. pixeltable/metadata/converters/convert_22.py +3 -2
  154. pixeltable/metadata/converters/convert_23.py +33 -0
  155. pixeltable/metadata/converters/convert_24.py +55 -0
  156. pixeltable/metadata/converters/convert_25.py +19 -0
  157. pixeltable/metadata/converters/convert_26.py +23 -0
  158. pixeltable/metadata/converters/convert_27.py +29 -0
  159. pixeltable/metadata/converters/convert_28.py +13 -0
  160. pixeltable/metadata/converters/convert_29.py +110 -0
  161. pixeltable/metadata/converters/convert_30.py +63 -0
  162. pixeltable/metadata/converters/convert_31.py +11 -0
  163. pixeltable/metadata/converters/convert_32.py +15 -0
  164. pixeltable/metadata/converters/convert_33.py +17 -0
  165. pixeltable/metadata/converters/convert_34.py +21 -0
  166. pixeltable/metadata/converters/convert_35.py +9 -0
  167. pixeltable/metadata/converters/convert_36.py +38 -0
  168. pixeltable/metadata/converters/convert_37.py +15 -0
  169. pixeltable/metadata/converters/convert_38.py +39 -0
  170. pixeltable/metadata/converters/convert_39.py +124 -0
  171. pixeltable/metadata/converters/convert_40.py +73 -0
  172. pixeltable/metadata/converters/convert_41.py +12 -0
  173. pixeltable/metadata/converters/convert_42.py +9 -0
  174. pixeltable/metadata/converters/convert_43.py +44 -0
  175. pixeltable/metadata/converters/util.py +44 -18
  176. pixeltable/metadata/notes.py +21 -0
  177. pixeltable/metadata/schema.py +185 -42
  178. pixeltable/metadata/utils.py +74 -0
  179. pixeltable/mypy/__init__.py +3 -0
  180. pixeltable/mypy/mypy_plugin.py +123 -0
  181. pixeltable/plan.py +616 -225
  182. pixeltable/share/__init__.py +3 -0
  183. pixeltable/share/packager.py +797 -0
  184. pixeltable/share/protocol/__init__.py +33 -0
  185. pixeltable/share/protocol/common.py +165 -0
  186. pixeltable/share/protocol/operation_types.py +33 -0
  187. pixeltable/share/protocol/replica.py +119 -0
  188. pixeltable/share/publish.py +349 -0
  189. pixeltable/store.py +398 -232
  190. pixeltable/type_system.py +730 -267
  191. pixeltable/utils/__init__.py +40 -0
  192. pixeltable/utils/arrow.py +201 -29
  193. pixeltable/utils/av.py +298 -0
  194. pixeltable/utils/azure_store.py +346 -0
  195. pixeltable/utils/coco.py +26 -27
  196. pixeltable/utils/code.py +4 -4
  197. pixeltable/utils/console_output.py +46 -0
  198. pixeltable/utils/coroutine.py +24 -0
  199. pixeltable/utils/dbms.py +92 -0
  200. pixeltable/utils/description_helper.py +11 -12
  201. pixeltable/utils/documents.py +60 -61
  202. pixeltable/utils/exception_handler.py +36 -0
  203. pixeltable/utils/filecache.py +38 -22
  204. pixeltable/utils/formatter.py +88 -51
  205. pixeltable/utils/gcs_store.py +295 -0
  206. pixeltable/utils/http.py +133 -0
  207. pixeltable/utils/http_server.py +14 -13
  208. pixeltable/utils/iceberg.py +13 -0
  209. pixeltable/utils/image.py +17 -0
  210. pixeltable/utils/lancedb.py +90 -0
  211. pixeltable/utils/local_store.py +322 -0
  212. pixeltable/utils/misc.py +5 -0
  213. pixeltable/utils/object_stores.py +573 -0
  214. pixeltable/utils/pydantic.py +60 -0
  215. pixeltable/utils/pytorch.py +20 -20
  216. pixeltable/utils/s3_store.py +527 -0
  217. pixeltable/utils/sql.py +32 -5
  218. pixeltable/utils/system.py +30 -0
  219. pixeltable/utils/transactional_directory.py +4 -3
  220. pixeltable-0.5.7.dist-info/METADATA +579 -0
  221. pixeltable-0.5.7.dist-info/RECORD +227 -0
  222. {pixeltable-0.2.26.dist-info → pixeltable-0.5.7.dist-info}/WHEEL +1 -1
  223. pixeltable-0.5.7.dist-info/entry_points.txt +2 -0
  224. pixeltable/__version__.py +0 -3
  225. pixeltable/catalog/named_function.py +0 -36
  226. pixeltable/catalog/path_dict.py +0 -141
  227. pixeltable/dataframe.py +0 -894
  228. pixeltable/exec/expr_eval_node.py +0 -232
  229. pixeltable/ext/__init__.py +0 -14
  230. pixeltable/ext/functions/__init__.py +0 -8
  231. pixeltable/ext/functions/whisperx.py +0 -77
  232. pixeltable/ext/functions/yolox.py +0 -157
  233. pixeltable/tool/create_test_db_dump.py +0 -311
  234. pixeltable/tool/create_test_video.py +0 -81
  235. pixeltable/tool/doc_plugins/griffe.py +0 -50
  236. pixeltable/tool/doc_plugins/mkdocstrings.py +0 -6
  237. pixeltable/tool/doc_plugins/templates/material/udf.html.jinja +0 -135
  238. pixeltable/tool/embed_udf.py +0 -9
  239. pixeltable/tool/mypy_plugin.py +0 -55
  240. pixeltable/utils/media_store.py +0 -76
  241. pixeltable/utils/s3.py +0 -16
  242. pixeltable-0.2.26.dist-info/METADATA +0 -400
  243. pixeltable-0.2.26.dist-info/RECORD +0 -156
  244. pixeltable-0.2.26.dist-info/entry_points.txt +0 -3
  245. {pixeltable-0.2.26.dist-info → pixeltable-0.5.7.dist-info/licenses}/LICENSE +0 -0
pixeltable/functions/timestamp.py

@@ -1,5 +1,5 @@
 """
-Pixeltable [UDFs](https://pixeltable.readme.io/docs/user-defined-functions-udfs) for `TimestampType`.
+Pixeltable UDFs for `TimestampType`.

 Usage example:
 ```python
@@ -11,7 +11,6 @@ t.select(t.timestamp_col.year, t.timestamp_col.weekday()).collect()
 """

 from datetime import datetime
-from typing import Optional

 import sqlalchemy as sql

@@ -19,6 +18,8 @@ import pixeltable as pxt
 from pixeltable.env import Env
 from pixeltable.utils.code import local_public_names

+_SQL_ZERO = sql.literal(0)
+

 @pxt.udf(is_property=True)
 def year(self: datetime) -> int:
@@ -132,9 +133,11 @@ def astimezone(self: datetime, tz: str) -> datetime:
     Convert the datetime to the given time zone.

     Args:
-        tz: The time zone to convert to. Must be a valid time zone name from the IANA Time Zone Database.
+        tz: The time zone to convert to. Must be a valid time zone name from the
+            [IANA Time Zone Database](https://en.wikipedia.org/wiki/List_of_tz_database_time_zones).
     """
     from zoneinfo import ZoneInfo
+
     tzinfo = ZoneInfo(tz)
     return self.astimezone(tzinfo)

@@ -190,7 +193,9 @@ def isoformat(self: datetime, sep: str = 'T', timespec: str = 'auto') -> str:

     Args:
         sep: Separator between date and time.
-        timespec: The number of additional terms in the output. See the [`datetime.isoformat()`](https://docs.python.org/3/library/datetime.html#datetime.datetime.isoformat) documentation for more details.
+        timespec: The number of additional terms in the output. See the
+            [`datetime.isoformat()`](https://docs.python.org/3/library/datetime.html#datetime.datetime.isoformat)
+            documentation for more details.
     """
     return self.isoformat(sep=sep, timespec=timespec)

@@ -203,14 +208,15 @@ def strftime(self: datetime, format: str) -> str:
     Equivalent to [`datetime.strftime()`](https://docs.python.org/3/library/datetime.html#datetime.datetime.strftime).

     Args:
-        format: The format string to control the output. For a complete list of formatting directives, see [`strftime()` and `strptime()` Behavior](https://docs.python.org/3/library/datetime.html#strftime-and-strptime-behavior).
+        format: The format string to control the output. For a complete list of formatting directives, see
+            [`strftime()` and `strptime()` Behavior](https://docs.python.org/3/library/datetime.html#strftime-and-strptime-behavior).
     """
     return self.strftime(format)


 @pxt.udf(is_method=True)
 def make_timestamp(
-    year: int, month: int, day: int, hour: int = 0, minute: int = 0, second: int = 0, microsecond: int = 0
+    year: int, month: int, day: int, hour: int = 0, minute: int = 0, second: int = 0, microsecond: int = 0
 ) -> datetime:
     """
     Create a timestamp.
@@ -222,17 +228,23 @@ def make_timestamp(

 @make_timestamp.to_sql
 def _(
-    year: sql.ColumnElement, month: sql.ColumnElement, day: sql.ColumnElement,
-    hour: sql.ColumnElement = sql.literal(0), minute: sql.ColumnElement = sql.literal(0),
-    second: sql.ColumnElement = sql.literal(0), microsecond: sql.ColumnElement = sql.literal(0)
+    year: sql.ColumnElement,
+    month: sql.ColumnElement,
+    day: sql.ColumnElement,
+    hour: sql.ColumnElement = _SQL_ZERO,
+    minute: sql.ColumnElement = _SQL_ZERO,
+    second: sql.ColumnElement = _SQL_ZERO,
+    microsecond: sql.ColumnElement = _SQL_ZERO,
 ) -> sql.ColumnElement:
     return sql.func.make_timestamptz(
-        sql.cast(year, sql.Integer),
-        sql.cast(month, sql.Integer),
-        sql.cast(day, sql.Integer),
-        sql.cast(hour, sql.Integer),
-        sql.cast(minute, sql.Integer),
-        sql.cast(second + microsecond / 1000000.0, sql.Double))
+        year.cast(sql.Integer),
+        month.cast(sql.Integer),
+        day.cast(sql.Integer),
+        hour.cast(sql.Integer),
+        minute.cast(sql.Integer),
+        (second + microsecond / 1000000.0).cast(sql.Float),
+    )
+

 # @pxt.udf
 # def date(self: datetime) -> datetime:
@@ -258,9 +270,15 @@ def _(

 @pxt.udf(is_method=True)
 def replace(
-    self: datetime, year: Optional[int] = None, month: Optional[int] = None, day: Optional[int] = None,
-    hour: Optional[int] = None, minute: Optional[int] = None, second: Optional[int] = None,
-    microsecond: Optional[int] = None) -> datetime:
+    self: datetime,
+    year: int | None = None,
+    month: int | None = None,
+    day: int | None = None,
+    hour: int | None = None,
+    minute: int | None = None,
+    second: int | None = None,
+    microsecond: int | None = None,
+) -> datetime:
     """
     Return a datetime with the same attributes, except for those attributes given new values by whichever keyword
     arguments are specified.
@@ -294,5 +312,5 @@ def posix_timestamp(self: datetime) -> float:
 __all__ = local_public_names(__name__)


-def __dir__():
+def __dir__() -> list[str]:
     return __all__
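
As context for the timestamp.py changes above, the following sketch shows how these UDFs are typically applied to a table. The `year`/`weekday` usage comes from the module docstring; the table name `events` and column `ts` are hypothetical:

```python
import pixeltable as pxt
from pixeltable.functions import timestamp as pxt_ts

t = pxt.get_table('events')  # hypothetical table with a timestamp column 'ts'

# property- and method-style UDFs from this module
t.select(t.ts.year, t.ts.weekday(), t.ts.astimezone('America/Los_Angeles')).collect()

# make_timestamp assembles a timestamp from integer parts;
# hour, minute, second, and microsecond default to 0
t.select(pxt_ts.make_timestamp(year=t.ts.year, month=t.ts.month, day=t.ts.day)).collect()
```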

pixeltable/functions/together.py

@@ -1,13 +1,13 @@
 """
-Pixeltable [UDFs](https://pixeltable.readme.io/docs/user-defined-functions-udfs)
+Pixeltable UDFs
 that wrap various endpoints from the Together AI API. In order to use them, you must
 first `pip install together` and configure your Together AI credentials, as described in
-the [Working with Together AI](https://pixeltable.readme.io/docs/together-ai) tutorial.
+the [Working with Together AI](https://docs.pixeltable.com/notebooks/integrations/working-with-together-ai) tutorial.
 """

 import base64
 import io
-from typing import TYPE_CHECKING, Callable, Optional, TypeVar
+from typing import TYPE_CHECKING, Any, Callable, TypeVar

 import numpy as np
 import PIL.Image
@@ -16,6 +16,7 @@ import tenacity
 import pixeltable as pxt
 import pixeltable.exceptions as excs
+import pixeltable.type_system as ts
 from pixeltable import env
 from pixeltable.func import Batch
 from pixeltable.utils.code import local_public_names

@@ -25,12 +26,13 @@ if TYPE_CHECKING:


 @env.register_client('together')
-def _(api_key: str) -> 'together.Together':
+def _(api_key: str) -> 'together.AsyncTogether':
     import together
-    return together.Together(api_key=api_key)

+    return together.AsyncTogether(api_key=api_key)

-def _together_client() -> 'together.Together':
+
+def _together_client() -> 'together.AsyncTogether':
     return env.Env.get().get_client('together')


@@ -39,6 +41,7 @@ T = TypeVar('T')

 def _retry(fn: Callable[..., T]) -> Callable[..., T]:
     import together
+
     return tenacity.retry(
         retry=tenacity.retry_if_exception_type(together.error.RateLimitError),
         wait=tenacity.wait_random_exponential(multiplier=1, max=60),
@@ -46,27 +49,17 @@ def _retry(fn: Callable[..., T]) -> Callable[..., T]:
     )(fn)


-@pxt.udf
-def completions(
-    prompt: str,
-    *,
-    model: str,
-    max_tokens: Optional[int] = None,
-    stop: Optional[list] = None,
-    temperature: Optional[float] = None,
-    top_p: Optional[float] = None,
-    top_k: Optional[int] = None,
-    repetition_penalty: Optional[float] = None,
-    logprobs: Optional[int] = None,
-    echo: Optional[bool] = None,
-    n: Optional[int] = None,
-    safety_model: Optional[str] = None,
-) -> dict:
+@pxt.udf(resource_pool='request-rate:together:chat')
+async def completions(prompt: str, *, model: str, model_kwargs: dict[str, Any] | None = None) -> dict:
     """
     Generate completions based on a given prompt using a specified model.

     Equivalent to the Together AI `completions` API endpoint.
-    For additional details, see: [https://docs.together.ai/reference/completions-1](https://docs.together.ai/reference/completions-1)
+    For additional details, see: <https://docs.together.ai/reference/completions-1>
+
+    Request throttling:
+        Applies the rate limit set in the config (section `together.rate_limits`, key `chat`). If no rate
+        limit is configured, uses a default of 600 RPM.

     __Requirements:__

@@ -75,61 +68,38 @@ def completions(
     Args:
         prompt: A string providing context for the model to complete.
         model: The name of the model to query.
-
-        For details on the other parameters, see: [https://docs.together.ai/reference/completions-1](https://docs.together.ai/reference/completions-1)
+        model_kwargs: Additional keyword arguments for the Together `completions` API.
+            For details on the available parameters, see: <https://docs.together.ai/reference/completions-1>

     Returns:
         A dictionary containing the response and other metadata.

     Examples:
-        Add a computed column that applies the model `mistralai/Mixtral-8x7B-v0.1` to an existing Pixeltable column `tbl.prompt`
-        of the table `tbl`:
+        Add a computed column that applies the model `mistralai/Mixtral-8x7B-v0.1` to an existing Pixeltable column
+        `tbl.prompt` of the table `tbl`:

-        >>> tbl['response'] = completions(tbl.prompt, model='mistralai/Mixtral-8x7B-v0.1')
+        >>> tbl.add_computed_column(response=completions(tbl.prompt, model='mistralai/Mixtral-8x7B-v0.1'))
     """
-    return (
-        _retry(_together_client().completions.create)(
-            prompt=prompt,
-            model=model,
-            max_tokens=max_tokens,
-            stop=stop,
-            temperature=temperature,
-            top_p=top_p,
-            top_k=top_k,
-            repetition_penalty=repetition_penalty,
-            logprobs=logprobs,
-            echo=echo,
-            n=n,
-            safety_model=safety_model,
-        )
-        .dict()
-    )
-
-
-@pxt.udf
-def chat_completions(
-    messages: list[dict[str, str]],
-    *,
-    model: str,
-    max_tokens: Optional[int] = None,
-    stop: Optional[list[str]] = None,
-    temperature: Optional[float] = None,
-    top_p: Optional[float] = None,
-    top_k: Optional[int] = None,
-    repetition_penalty: Optional[float] = None,
-    logprobs: Optional[int] = None,
-    echo: Optional[bool] = None,
-    n: Optional[int] = None,
-    safety_model: Optional[str] = None,
-    response_format: Optional[dict] = None,
-    tools: Optional[dict] = None,
-    tool_choice: Optional[dict] = None,
+    if model_kwargs is None:
+        model_kwargs = {}
+
+    result = await _together_client().completions.create(prompt=prompt, model=model, **model_kwargs)
+    return result.dict()
+
+
+@pxt.udf(resource_pool='request-rate:together:chat')
+async def chat_completions(
+    messages: list[dict[str, str]], *, model: str, model_kwargs: dict[str, Any] | None = None
 ) -> dict:
     """
     Generate chat completions based on a given prompt using a specified model.

     Equivalent to the Together AI `chat/completions` API endpoint.
-    For additional details, see: [https://docs.together.ai/reference/chat-completions-1](https://docs.together.ai/reference/chat-completions-1)
+    For additional details, see: <https://docs.together.ai/reference/chat-completions-1>
+
+    Request throttling:
+        Applies the rate limit set in the config (section `together.rate_limits`, key `chat`). If no rate
+        limit is configured, uses a default of 600 RPM.

     __Requirements:__

@@ -138,39 +108,24 @@ def chat_completions(
     Args:
         messages: A list of messages comprising the conversation so far.
         model: The name of the model to query.
-
-        For details on the other parameters, see: [https://docs.together.ai/reference/chat-completions-1](https://docs.together.ai/reference/chat-completions-1)
+        model_kwargs: Additional keyword arguments for the Together `chat/completions` API.
+            For details on the available parameters, see: <https://docs.together.ai/reference/chat-completions-1>

     Returns:
         A dictionary containing the response and other metadata.

     Examples:
-        Add a computed column that applies the model `mistralai/Mixtral-8x7B-v0.1` to an existing Pixeltable column `tbl.prompt`
-        of the table `tbl`:
+        Add a computed column that applies the model `mistralai/Mixtral-8x7B-v0.1` to an existing Pixeltable column
+        `tbl.prompt` of the table `tbl`:

         >>> messages = [{'role': 'user', 'content': tbl.prompt}]
-        ... tbl['response'] = chat_completions(messages, model='mistralai/Mixtral-8x7B-v0.1')
+        ... tbl.add_computed_column(response=chat_completions(messages, model='mistralai/Mixtral-8x7B-v0.1'))
     """
-    return (
-        _retry(_together_client().chat.completions.create)(
-            messages=messages,
-            model=model,
-            max_tokens=max_tokens,
-            stop=stop,
-            temperature=temperature,
-            top_p=top_p,
-            top_k=top_k,
-            repetition_penalty=repetition_penalty,
-            logprobs=logprobs,
-            echo=echo,
-            n=n,
-            safety_model=safety_model,
-            response_format=response_format,
-            tools=tools,
-            tool_choice=tool_choice,
-        )
-        .dict()
-    )
+    if model_kwargs is None:
+        model_kwargs = {}
+
+    result = await _together_client().chat.completions.create(messages=messages, model=model, **model_kwargs)
+    return result.dict()


 _embedding_dimensions_cache = {
@@ -185,13 +140,17 @@ _embedding_dimensions_cache = {
 }


-@pxt.udf(batch_size=32)
-def embeddings(input: Batch[str], *, model: str) -> Batch[pxt.Array[(None,), pxt.Float]]:
+@pxt.udf(batch_size=32, resource_pool='request-rate:together:embeddings')
+async def embeddings(input: Batch[str], *, model: str) -> Batch[pxt.Array[(None,), pxt.Float]]:
     """
     Query an embedding model for a given string of text.

     Equivalent to the Together AI `embeddings` API endpoint.
-    For additional details, see: [https://docs.together.ai/reference/embeddings-2](https://docs.together.ai/reference/embeddings-2)
+    For additional details, see: <https://docs.together.ai/reference/embeddings-2>
+
+    Request throttling:
+        Applies the rate limit set in the config (section `together.rate_limits`, key `embeddings`). If no rate
+        limit is configured, uses a default of 600 RPM.

     __Requirements:__

@@ -208,37 +167,32 @@ def embeddings(input: Batch[str], *, model: str) -> Batch[pxt.Array[(None,), pxt
         Add a computed column that applies the model `togethercomputer/m2-bert-80M-8k-retrieval`
         to an existing Pixeltable column `tbl.text` of the table `tbl`:

-        >>> tbl['response'] = embeddings(tbl.text, model='togethercomputer/m2-bert-80M-8k-retrieval')
+        >>> tbl.add_computed_column(response=embeddings(tbl.text, model='togethercomputer/m2-bert-80M-8k-retrieval'))
     """
-    result = _retry(_together_client().embeddings.create)(input=input, model=model)
+    result = await _together_client().embeddings.create(input=input, model=model)
     return [np.array(data.embedding, dtype=np.float64) for data in result.data]


 @embeddings.conditional_return_type
-def _(model: str) -> pxt.ArrayType:
+def _(model: str) -> ts.ArrayType:
     if model not in _embedding_dimensions_cache:
         # TODO: find some other way to retrieve a sample
-        return pxt.ArrayType((None,), dtype=pxt.FloatType())
+        return ts.ArrayType((None,), dtype=ts.FloatType())
     dimensions = _embedding_dimensions_cache[model]
-    return pxt.ArrayType((dimensions,), dtype=pxt.FloatType())
-
-
-@pxt.udf
-def image_generations(
-    prompt: str,
-    *,
-    model: str,
-    steps: Optional[int] = None,
-    seed: Optional[int] = None,
-    height: Optional[int] = None,
-    width: Optional[int] = None,
-    negative_prompt: Optional[str] = None,
-) -> PIL.Image.Image:
+    return ts.ArrayType((dimensions,), dtype=ts.FloatType())
+
+
+@pxt.udf(resource_pool='request-rate:together:images')
+async def image_generations(prompt: str, *, model: str, model_kwargs: dict[str, Any] | None = None) -> PIL.Image.Image:
     """
     Generate images based on a given prompt using a specified model.

     Equivalent to the Together AI `images/generations` API endpoint.
-    For additional details, see: [https://docs.together.ai/reference/post_images-generations](https://docs.together.ai/reference/post_images-generations)
+    For additional details, see: <https://docs.together.ai/reference/post_images-generations>
+
+    Request throttling:
+        Applies the rate limit set in the config (section `together.rate_limits`, key `images`). If no rate
+        limit is configured, uses a default of 600 RPM.

     __Requirements:__

@@ -247,8 +201,8 @@ def image_generations(
     Args:
         prompt: A description of the desired images.
         model: The model to use for image generation.
-
-        For details on the other parameters, see: [https://docs.together.ai/reference/post_images-generations](https://docs.together.ai/reference/post_images-generations)
+        model_kwargs: Additional keyword args for the Together `images/generations` API.
+            For details on the available parameters, see: <https://docs.together.ai/reference/post_images-generations>

     Returns:
         The generated image.
@@ -257,11 +211,14 @@ def image_generations(
         Add a computed column that applies the model `stabilityai/stable-diffusion-xl-base-1.0`
         to an existing Pixeltable column `tbl.prompt` of the table `tbl`:

-        >>> tbl['response'] = image_generations(tbl.prompt, model='stabilityai/stable-diffusion-xl-base-1.0')
+        >>> tbl.add_computed_column(
+        ...     response=image_generations(tbl.prompt, model='stabilityai/stable-diffusion-xl-base-1.0')
+        ... )
     """
-    result = _retry(_together_client().images.generate)(
-        prompt=prompt, model=model, steps=steps, seed=seed, height=height, width=width, negative_prompt=negative_prompt
-    )
+    if model_kwargs is None:
+        model_kwargs = {}
+
+    result = await _together_client().images.generate(prompt=prompt, model=model, **model_kwargs)
     if result.data[0].b64_json is not None:
         b64_bytes = base64.b64decode(result.data[0].b64_json)
         img = PIL.Image.open(io.BytesIO(b64_bytes))
@@ -282,5 +239,5 @@ def image_generations(
 __all__ = local_public_names(__name__)


-def __dir__():
+def __dir__() -> list[str]:
     return __all__
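
The together.py changes above replace the long lists of optional endpoint parameters with a single `model_kwargs` dict that is passed through to the Together API, make the UDFs async with per-endpoint rate limiting, and switch the docstring examples from `tbl['response'] = ...` to `tbl.add_computed_column(...)`. A minimal sketch of the new calling convention; the table name and the JSON-path extraction at the end are illustrative assumptions:

```python
import pixeltable as pxt
from pixeltable.functions import together

tbl = pxt.get_table('my_prompts')  # hypothetical table with a string column 'prompt'

messages = [{'role': 'user', 'content': tbl.prompt}]
tbl.add_computed_column(
    response=together.chat_completions(
        messages,
        model='mistralai/Mixtral-8x7B-v0.1',
        # parameters that used to be top-level arguments (max_tokens, temperature, ...)
        # are now passed through model_kwargs
        model_kwargs={'max_tokens': 300, 'temperature': 0.7},
    )
)
# illustrative JSON-path extraction of the completion text from the response dict
tbl.add_computed_column(answer=tbl.response.choices[0].message.content)
```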

pixeltable/functions/twelvelabs.py (new file)

@@ -0,0 +1,188 @@
+"""
+Pixeltable UDFs
+that wrap various endpoints from the TwelveLabs API. In order to use them, you must
+first `pip install twelvelabs` and configure your TwelveLabs credentials, as described in
+the [Working with TwelveLabs](https://docs.pixeltable.com/notebooks/integrations/working-with-twelvelabs) tutorial.
+"""
+
+from base64 import b64encode
+from typing import TYPE_CHECKING, Literal
+
+import numpy as np
+
+import pixeltable as pxt
+from pixeltable import env, type_system as ts
+from pixeltable.utils.code import local_public_names
+from pixeltable.utils.image import to_base64
+
+if TYPE_CHECKING:
+    from twelvelabs import AsyncTwelveLabs
+
+
+@env.register_client('twelvelabs')
+def _(api_key: str) -> 'AsyncTwelveLabs':
+    from twelvelabs import AsyncTwelveLabs
+
+    return AsyncTwelveLabs(api_key=api_key)
+
+
+def _twelvelabs_client() -> 'AsyncTwelveLabs':
+    return env.Env.get().get_client('twelvelabs')
+
+
+@pxt.udf(resource_pool='request-rate:twelvelabs')
+async def embed(text: str, image: pxt.Image | None = None, *, model_name: str) -> pxt.Array[np.float32] | None:
+    """
+    Creates an embedding vector for the given text, audio, image, or video input.
+
+    Each UDF signature corresponds to one of the four supported input types. If text is specified, it is possible to
+    specify an image as well, corresponding to the `text_image` embedding type in the TwelveLabs API. This is
+    (currently) the only way to include more than one input type at a time.
+
+    Equivalent to the TwelveLabs Embed API:
+    <https://docs.twelvelabs.io/v1.3/docs/guides/create-embeddings>
+
+    Request throttling:
+        Applies the rate limit set in the config (section `twelvelabs`, key `rate_limit`). If no rate
+        limit is configured, uses a default of 600 RPM.
+
+    __Requirements:__
+
+    - `pip install twelvelabs`
+
+    Args:
+        model_name: The name of the model to use. Check
+            [the TwelveLabs documentation](https://docs.twelvelabs.io/v1.3/sdk-reference/python/create-text-image-and-audio-embeddings)
+            for available models.
+        text: The text to embed.
+        image: If specified, the embedding will be created from both the text and the image.
+
+    Returns:
+        The embedding.
+
+    Examples:
+        Add a computed column `embed` for an embedding of a string column `input`:
+
+        >>> tbl.add_computed_column(
+        ...     embed=embed(model_name='marengo3.0', text=tbl.input)
+        ... )
+    """
+    env.Env.get().require_package('twelvelabs')
+    import twelvelabs
+
+    cl = _twelvelabs_client()
+    res: twelvelabs.EmbeddingSuccessResponse
+    if image is None:
+        # Text-only
+        res = await cl.embed.v_2.create(
+            input_type='text', model_name=model_name, text=twelvelabs.TextInputRequest(input_text=text)
+        )
+    else:
+        b64str = to_base64(image, format=('png' if image.has_transparency_data else 'jpeg'))
+        res = await cl.embed.v_2.create(
+            input_type='text_image',
+            model_name=model_name,
+            text_image=twelvelabs.TextImageInputRequest(
+                media_source=twelvelabs.MediaSource(base_64_string=b64str), input_text=text
+            ),
+        )
+    if not res.data:
+        raise pxt.Error(f"Didn't receive embedding for text: {text}\n{res}")
+    vector = res.data[0].embedding
+    return np.array(vector, dtype='float32')
+
+
+@embed.overload
+async def _(image: pxt.Image, *, model_name: str) -> pxt.Array[np.float32] | None:
+    env.Env.get().require_package('twelvelabs')
+    import twelvelabs
+
+    cl = _twelvelabs_client()
+    b64_str = to_base64(image, format=('png' if image.has_transparency_data else 'jpeg'))
+    res = await cl.embed.v_2.create(
+        input_type='image',
+        model_name=model_name,
+        image=twelvelabs.ImageInputRequest(media_source=twelvelabs.MediaSource(base_64_string=b64_str)),
+    )
+    if not res.data:
+        raise pxt.Error(f"Didn't receive embedding for image: {image}\n{res}")
+    vector = res.data[0].embedding
+    return np.array(vector, dtype='float32')
+
+
+@embed.overload
+async def _(
+    audio: pxt.Audio,
+    *,
+    model_name: str,
+    start_sec: float | None = None,
+    end_sec: float | None = None,
+    embedding_option: list[Literal['audio', 'transcription']] | None = None,
+) -> pxt.Array[np.float32] | None:
+    env.Env.get().require_package('twelvelabs')
+    import twelvelabs
+
+    cl = _twelvelabs_client()
+    with open(audio, 'rb') as fp:
+        b64_str = b64encode(fp.read()).decode('utf-8')
+    res = await cl.embed.v_2.create(
+        input_type='audio',
+        model_name=model_name,
+        audio=twelvelabs.AudioInputRequest(
+            media_source=twelvelabs.MediaSource(base_64_string=b64_str),
+            start_sec=start_sec,
+            end_sec=end_sec,
+            embedding_option=embedding_option,
+        ),
+    )
+    if not res.data:
+        raise pxt.Error(f"Didn't receive embedding for audio: {audio}\n{res}")
+    vector = res.data[0].embedding
+    return np.array(vector, dtype='float32')
+
+
+@embed.overload
+async def _(
+    video: pxt.Video,
+    *,
+    model_name: str,
+    start_sec: float | None = None,
+    end_sec: float | None = None,
+    embedding_option: list[Literal['visual', 'audio', 'transcription']] | None = None,
+) -> pxt.Array[np.float32] | None:
+    env.Env.get().require_package('twelvelabs')
+    import twelvelabs
+
+    cl = _twelvelabs_client()
+    with open(video, 'rb') as fp:
+        b64_str = b64encode(fp.read()).decode('utf-8')
+    res = await cl.embed.v_2.create(
+        input_type='video',
+        model_name=model_name,
+        video=twelvelabs.VideoInputRequest(
+            media_source=twelvelabs.MediaSource(base_64_string=b64_str),
+            start_sec=start_sec,
+            end_sec=end_sec,
+            embedding_option=embedding_option,
+        ),
+    )
+    if not res.data:
+        raise pxt.Error(f"Didn't receive embedding for video: {video}\n{res}")
+    vector = res.data[0].embedding
+    return np.array(vector, dtype='float32')
+
+
+@embed.conditional_return_type
+def _(model_name: str) -> ts.ArrayType:
+    if model_name == 'Marengo-retrieval-2.7':
+        return ts.ArrayType(shape=(1024,), dtype=np.dtype('float32'))
+    if model_name == 'marengo3.0':
+        return ts.ArrayType(shape=(512,), dtype=np.dtype('float32'))
+    return ts.ArrayType(dtype=np.dtype('float32'))
+
+
+__all__ = local_public_names(__name__)
+
+
+def __dir__() -> list[str]:
+    return __all__
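
twelvelabs.py is a new module whose `embed` UDF has overloads for text, image, audio, and video input. A short usage sketch based on the docstring example above; the table name `media` and its columns are hypothetical:

```python
import pixeltable as pxt
from pixeltable.functions.twelvelabs import embed

# hypothetical table with a string column 'input' and an image column 'img'
tbl = pxt.get_table('media')

# text embedding (the docstring example)
tbl.add_computed_column(text_embed=embed(model_name='marengo3.0', text=tbl.input))

# image overload: the image is passed as the first positional argument
tbl.add_computed_column(img_embed=embed(tbl.img, model_name='marengo3.0'))
```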

pixeltable/functions/util.py

@@ -1,5 +1,6 @@
 import PIL.Image

+from pixeltable.config import Config
 from pixeltable.env import Env


@@ -7,10 +8,14 @@ def resolve_torch_device(device: str, allow_mps: bool = True) -> str:
     Env.get().require_package('torch')
     import torch

+    mps_enabled = Config.get().get_bool_value('enable_mps')
+    if mps_enabled is None:
+        mps_enabled = True  # Default to True if not set in config
+
     if device == 'auto':
         if torch.cuda.is_available():
             return 'cuda'
-        if allow_mps and torch.backends.mps.is_available():
+        if mps_enabled and allow_mps and torch.backends.mps.is_available():
             return 'mps'
         return 'cpu'
     return device
@@ -21,7 +26,7 @@ def normalize_image_mode(image: PIL.Image.Image) -> PIL.Image.Image:
     Converts grayscale images to 3-channel for compatibility with models that only work with
     multichannel input.
     """
-    if image.mode == '1' or image.mode == 'L':
+    if image.mode in ('1', 'L'):
         return image.convert('RGB')
     if image.mode == 'LA':
         return image.convert('RGBA')
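
The util.py change above makes MPS usage configurable: `resolve_torch_device` now consults the `enable_mps` config value before falling back to Apple's MPS backend. A rough sketch of the resulting behavior, assuming the function is called directly (it is an internal helper):

```python
from pixeltable.functions.util import resolve_torch_device

# 'auto' resolves to 'cuda' if available, then 'mps' (only when the 'enable_mps'
# config value is not set to false and allow_mps=True), otherwise 'cpu'
device = resolve_torch_device('auto')
cpu_or_cuda = resolve_torch_device('auto', allow_mps=False)  # never 'mps'

# an explicit device string is returned unchanged
assert resolve_torch_device('cpu') == 'cpu'
```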