together-1.4.5.tar.gz → together-1.4.6.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (65)
  1. {together-1.4.5 → together-1.4.6}/PKG-INFO +1 -1
  2. {together-1.4.5 → together-1.4.6}/pyproject.toml +1 -1
  3. {together-1.4.5 → together-1.4.6}/src/together/cli/api/endpoints.py +20 -1
  4. {together-1.4.5 → together-1.4.6}/src/together/cli/api/models.py +20 -7
  5. {together-1.4.5 → together-1.4.6}/src/together/resources/endpoints.py +24 -4
  6. together-1.4.6/src/together/resources/models.py +134 -0
  7. together-1.4.5/src/together/resources/models.py +0 -75
  8. {together-1.4.5 → together-1.4.6}/LICENSE +0 -0
  9. {together-1.4.5 → together-1.4.6}/README.md +0 -0
  10. {together-1.4.5 → together-1.4.6}/src/together/__init__.py +0 -0
  11. {together-1.4.5 → together-1.4.6}/src/together/abstract/__init__.py +0 -0
  12. {together-1.4.5 → together-1.4.6}/src/together/abstract/api_requestor.py +0 -0
  13. {together-1.4.5 → together-1.4.6}/src/together/cli/__init__.py +0 -0
  14. {together-1.4.5 → together-1.4.6}/src/together/cli/api/__init__.py +0 -0
  15. {together-1.4.5 → together-1.4.6}/src/together/cli/api/chat.py +0 -0
  16. {together-1.4.5 → together-1.4.6}/src/together/cli/api/completions.py +0 -0
  17. {together-1.4.5 → together-1.4.6}/src/together/cli/api/files.py +0 -0
  18. {together-1.4.5 → together-1.4.6}/src/together/cli/api/finetune.py +0 -0
  19. {together-1.4.5 → together-1.4.6}/src/together/cli/api/images.py +0 -0
  20. {together-1.4.5 → together-1.4.6}/src/together/cli/api/utils.py +0 -0
  21. {together-1.4.5 → together-1.4.6}/src/together/cli/cli.py +0 -0
  22. {together-1.4.5 → together-1.4.6}/src/together/client.py +0 -0
  23. {together-1.4.5 → together-1.4.6}/src/together/constants.py +0 -0
  24. {together-1.4.5 → together-1.4.6}/src/together/error.py +0 -0
  25. {together-1.4.5 → together-1.4.6}/src/together/filemanager.py +0 -0
  26. {together-1.4.5 → together-1.4.6}/src/together/legacy/__init__.py +0 -0
  27. {together-1.4.5 → together-1.4.6}/src/together/legacy/base.py +0 -0
  28. {together-1.4.5 → together-1.4.6}/src/together/legacy/complete.py +0 -0
  29. {together-1.4.5 → together-1.4.6}/src/together/legacy/embeddings.py +0 -0
  30. {together-1.4.5 → together-1.4.6}/src/together/legacy/files.py +0 -0
  31. {together-1.4.5 → together-1.4.6}/src/together/legacy/finetune.py +0 -0
  32. {together-1.4.5 → together-1.4.6}/src/together/legacy/images.py +0 -0
  33. {together-1.4.5 → together-1.4.6}/src/together/legacy/models.py +0 -0
  34. {together-1.4.5 → together-1.4.6}/src/together/resources/__init__.py +0 -0
  35. {together-1.4.5 → together-1.4.6}/src/together/resources/audio/__init__.py +0 -0
  36. {together-1.4.5 → together-1.4.6}/src/together/resources/audio/speech.py +0 -0
  37. {together-1.4.5 → together-1.4.6}/src/together/resources/chat/__init__.py +0 -0
  38. {together-1.4.5 → together-1.4.6}/src/together/resources/chat/completions.py +0 -0
  39. {together-1.4.5 → together-1.4.6}/src/together/resources/completions.py +0 -0
  40. {together-1.4.5 → together-1.4.6}/src/together/resources/embeddings.py +0 -0
  41. {together-1.4.5 → together-1.4.6}/src/together/resources/files.py +0 -0
  42. {together-1.4.5 → together-1.4.6}/src/together/resources/finetune.py +0 -0
  43. {together-1.4.5 → together-1.4.6}/src/together/resources/images.py +0 -0
  44. {together-1.4.5 → together-1.4.6}/src/together/resources/rerank.py +0 -0
  45. {together-1.4.5 → together-1.4.6}/src/together/together_response.py +0 -0
  46. {together-1.4.5 → together-1.4.6}/src/together/types/__init__.py +0 -0
  47. {together-1.4.5 → together-1.4.6}/src/together/types/abstract.py +0 -0
  48. {together-1.4.5 → together-1.4.6}/src/together/types/audio_speech.py +0 -0
  49. {together-1.4.5 → together-1.4.6}/src/together/types/chat_completions.py +0 -0
  50. {together-1.4.5 → together-1.4.6}/src/together/types/common.py +0 -0
  51. {together-1.4.5 → together-1.4.6}/src/together/types/completions.py +0 -0
  52. {together-1.4.5 → together-1.4.6}/src/together/types/embeddings.py +0 -0
  53. {together-1.4.5 → together-1.4.6}/src/together/types/endpoints.py +0 -0
  54. {together-1.4.5 → together-1.4.6}/src/together/types/error.py +0 -0
  55. {together-1.4.5 → together-1.4.6}/src/together/types/files.py +0 -0
  56. {together-1.4.5 → together-1.4.6}/src/together/types/finetune.py +0 -0
  57. {together-1.4.5 → together-1.4.6}/src/together/types/images.py +0 -0
  58. {together-1.4.5 → together-1.4.6}/src/together/types/models.py +0 -0
  59. {together-1.4.5 → together-1.4.6}/src/together/types/rerank.py +0 -0
  60. {together-1.4.5 → together-1.4.6}/src/together/utils/__init__.py +0 -0
  61. {together-1.4.5 → together-1.4.6}/src/together/utils/_log.py +0 -0
  62. {together-1.4.5 → together-1.4.6}/src/together/utils/api_helpers.py +0 -0
  63. {together-1.4.5 → together-1.4.6}/src/together/utils/files.py +0 -0
  64. {together-1.4.5 → together-1.4.6}/src/together/utils/tools.py +0 -0
  65. {together-1.4.5 → together-1.4.6}/src/together/version.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: together
3
- Version: 1.4.5
3
+ Version: 1.4.6
4
4
  Summary: Python client for Together's Cloud Platform!
5
5
  License: Apache-2.0
6
6
  Author: Together AI
@@ -12,7 +12,7 @@ build-backend = "poetry.masonry.api"
12
12
 
13
13
  [tool.poetry]
14
14
  name = "together"
15
- version = "1.4.5"
15
+ version = "1.4.6"
16
16
  authors = [
17
17
  "Together AI <support@together.ai>"
18
18
  ]
@@ -127,6 +127,11 @@ def endpoints(ctx: click.Context) -> None:
127
127
  is_flag=True,
128
128
  help="Create the endpoint in STOPPED state instead of auto-starting it",
129
129
  )
130
+ @click.option(
131
+ "--inactive-timeout",
132
+ type=int,
133
+ help="Number of minutes of inactivity after which the endpoint will be automatically stopped. Set to 0 to disable.",
134
+ )
130
135
  @click.option(
131
136
  "--wait",
132
137
  is_flag=True,
@@ -146,6 +151,7 @@ def create(
146
151
  no_prompt_cache: bool,
147
152
  no_speculative_decoding: bool,
148
153
  no_auto_start: bool,
154
+ inactive_timeout: int | None,
149
155
  wait: bool,
150
156
  ) -> None:
151
157
  """Create a new dedicated inference endpoint."""
@@ -170,6 +176,7 @@ def create(
170
176
  disable_prompt_cache=no_prompt_cache,
171
177
  disable_speculative_decoding=no_speculative_decoding,
172
178
  state="STOPPED" if no_auto_start else "STARTED",
179
+ inactive_timeout=inactive_timeout,
173
180
  )
174
181
  except InvalidRequestError as e:
175
182
  print_api_error(e)
@@ -194,6 +201,8 @@ def create(
194
201
  click.echo(" Speculative decoding: disabled", err=True)
195
202
  if no_auto_start:
196
203
  click.echo(" Auto-start: disabled", err=True)
204
+ if inactive_timeout is not None:
205
+ click.echo(f" Inactive timeout: {inactive_timeout} minutes", err=True)
197
206
 
198
207
  click.echo(f"Endpoint created successfully, id: {response.id}", err=True)
199
208
 
@@ -371,6 +380,11 @@ def list(
371
380
  type=int,
372
381
  help="New maximum number of replicas to scale up to",
373
382
  )
383
+ @click.option(
384
+ "--inactive-timeout",
385
+ type=int,
386
+ help="Number of minutes of inactivity after which the endpoint will be automatically stopped. Set to 0 to disable.",
387
+ )
374
388
  @click.pass_obj
375
389
  @handle_api_errors
376
390
  def update(
@@ -379,9 +393,10 @@ def update(
379
393
  display_name: str | None,
380
394
  min_replicas: int | None,
381
395
  max_replicas: int | None,
396
+ inactive_timeout: int | None,
382
397
  ) -> None:
383
398
  """Update a dedicated inference endpoint's configuration."""
384
- if not any([display_name, min_replicas, max_replicas]):
399
+ if not any([display_name, min_replicas, max_replicas, inactive_timeout]):
385
400
  click.echo("Error: At least one update option must be specified", err=True)
386
401
  sys.exit(1)
387
402
 
@@ -400,6 +415,8 @@ def update(
400
415
  if min_replicas is not None and max_replicas is not None:
401
416
  kwargs["min_replicas"] = min_replicas
402
417
  kwargs["max_replicas"] = max_replicas
418
+ if inactive_timeout is not None:
419
+ kwargs["inactive_timeout"] = inactive_timeout
403
420
 
404
421
  _response = client.endpoints.update(endpoint_id, **kwargs)
405
422
 
@@ -410,6 +427,8 @@ def update(
410
427
  if min_replicas is not None and max_replicas is not None:
411
428
  click.echo(f" Min replicas: {min_replicas}", err=True)
412
429
  click.echo(f" Max replicas: {max_replicas}", err=True)
430
+ if inactive_timeout is not None:
431
+ click.echo(f" Inactive timeout: {inactive_timeout} minutes", err=True)
413
432
 
414
433
  click.echo("Successfully updated endpoint", err=True)
415
434
  click.echo(endpoint_id)
@@ -1,4 +1,4 @@
1
- from textwrap import wrap
1
+ import json as json_lib
2
2
 
3
3
  import click
4
4
  from tabulate import tabulate
@@ -15,12 +15,22 @@ def models(ctx: click.Context) -> None:
15
15
 
16
16
 
17
17
  @models.command()
18
+ @click.option(
19
+ "--type",
20
+ type=click.Choice(["dedicated"]),
21
+ help="Filter models by type (dedicated: models that can be deployed as dedicated endpoints)",
22
+ )
23
+ @click.option(
24
+ "--json",
25
+ is_flag=True,
26
+ help="Output in JSON format",
27
+ )
18
28
  @click.pass_context
19
- def list(ctx: click.Context) -> None:
29
+ def list(ctx: click.Context, type: str | None, json: bool) -> None:
20
30
  """List models"""
21
31
  client: Together = ctx.obj
22
32
 
23
- response = client.models.list()
33
+ response = client.models.list(dedicated=(type == "dedicated"))
24
34
 
25
35
  display_list = []
26
36
 
@@ -28,15 +38,18 @@ def list(ctx: click.Context) -> None:
28
38
  for model in response:
29
39
  display_list.append(
30
40
  {
31
- "ID": "\n".join(wrap(model.id or "", width=30)),
32
- "Name": "\n".join(wrap(model.display_name or "", width=30)),
41
+ "ID": model.id,
42
+ "Name": model.display_name,
33
43
  "Organization": model.organization,
34
44
  "Type": model.type,
35
45
  "Context Length": model.context_length,
36
- "License": "\n".join(wrap(model.license or "", width=30)),
46
+ "License": model.license,
37
47
  "Input per 1M token": model.pricing.input,
38
48
  "Output per 1M token": model.pricing.output,
39
49
  }
40
50
  )
41
51
 
42
- click.echo(tabulate(display_list, headers="keys", tablefmt="grid"))
52
+ if json:
53
+ click.echo(json_lib.dumps(display_list, indent=2))
54
+ else:
55
+ click.echo(tabulate(display_list, headers="keys", tablefmt="plain"))
@@ -59,6 +59,7 @@ class Endpoints:
59
59
  disable_prompt_cache: bool = False,
60
60
  disable_speculative_decoding: bool = False,
61
61
  state: Literal["STARTED", "STOPPED"] = "STARTED",
62
+ inactive_timeout: Optional[int] = None,
62
63
  ) -> DedicatedEndpoint:
63
64
  """
64
65
  Create a new dedicated endpoint.
@@ -72,6 +73,7 @@ class Endpoints:
72
73
  disable_prompt_cache (bool, optional): Whether to disable the prompt cache. Defaults to False.
73
74
  disable_speculative_decoding (bool, optional): Whether to disable speculative decoding. Defaults to False.
74
75
  state (str, optional): The desired state of the endpoint. Defaults to "STARTED".
76
+ inactive_timeout (int, optional): The number of minutes of inactivity after which the endpoint will be automatically stopped. Set to 0 to disable automatic timeout.
75
77
 
76
78
  Returns:
77
79
  DedicatedEndpoint: Object containing endpoint information
@@ -80,7 +82,7 @@ class Endpoints:
80
82
  client=self._client,
81
83
  )
82
84
 
83
- data: Dict[str, Union[str, bool, Dict[str, int]]] = {
85
+ data: Dict[str, Union[str, bool, Dict[str, int], int]] = {
84
86
  "model": model,
85
87
  "hardware": hardware,
86
88
  "autoscaling": {
@@ -95,6 +97,9 @@ class Endpoints:
95
97
  if display_name is not None:
96
98
  data["display_name"] = display_name
97
99
 
100
+ if inactive_timeout is not None:
101
+ data["inactive_timeout"] = inactive_timeout
102
+
98
103
  response, _, _ = requestor.request(
99
104
  options=TogetherRequest(
100
105
  method="POST",
@@ -161,6 +166,7 @@ class Endpoints:
161
166
  max_replicas: Optional[int] = None,
162
167
  state: Optional[Literal["STARTED", "STOPPED"]] = None,
163
168
  display_name: Optional[str] = None,
169
+ inactive_timeout: Optional[int] = None,
164
170
  ) -> DedicatedEndpoint:
165
171
  """
166
172
  Update an endpoint's configuration.
@@ -171,6 +177,7 @@ class Endpoints:
171
177
  max_replicas (int, optional): The maximum number of replicas to scale up to
172
178
  state (str, optional): The desired state of the endpoint ("STARTED" or "STOPPED")
173
179
  display_name (str, optional): A human-readable name for the endpoint
180
+ inactive_timeout (int, optional): The number of minutes of inactivity after which the endpoint will be automatically stopped. Set to 0 to disable automatic timeout.
174
181
 
175
182
  Returns:
176
183
  DedicatedEndpoint: Object containing endpoint information
@@ -179,7 +186,7 @@ class Endpoints:
179
186
  client=self._client,
180
187
  )
181
188
 
182
- data: Dict[str, Union[str, Dict[str, int]]] = {}
189
+ data: Dict[str, Union[str, Dict[str, int], int]] = {}
183
190
 
184
191
  if min_replicas is not None or max_replicas is not None:
185
192
  current_min = min_replicas
@@ -200,6 +207,9 @@ class Endpoints:
200
207
  if display_name is not None:
201
208
  data["display_name"] = display_name
202
209
 
210
+ if inactive_timeout is not None:
211
+ data["inactive_timeout"] = inactive_timeout
212
+
203
213
  response, _, _ = requestor.request(
204
214
  options=TogetherRequest(
205
215
  method="PATCH",
@@ -297,6 +307,7 @@ class AsyncEndpoints:
297
307
  disable_prompt_cache: bool = False,
298
308
  disable_speculative_decoding: bool = False,
299
309
  state: Literal["STARTED", "STOPPED"] = "STARTED",
310
+ inactive_timeout: Optional[int] = None,
300
311
  ) -> DedicatedEndpoint:
301
312
  """
302
313
  Create a new dedicated endpoint.
@@ -310,6 +321,7 @@ class AsyncEndpoints:
310
321
  disable_prompt_cache (bool, optional): Whether to disable the prompt cache. Defaults to False.
311
322
  disable_speculative_decoding (bool, optional): Whether to disable speculative decoding. Defaults to False.
312
323
  state (str, optional): The desired state of the endpoint. Defaults to "STARTED".
324
+ inactive_timeout (int, optional): The number of minutes of inactivity after which the endpoint will be automatically stopped. Set to 0 to disable automatic timeout.
313
325
 
314
326
  Returns:
315
327
  DedicatedEndpoint: Object containing endpoint information
@@ -318,7 +330,7 @@ class AsyncEndpoints:
318
330
  client=self._client,
319
331
  )
320
332
 
321
- data: Dict[str, Union[str, bool, Dict[str, int]]] = {
333
+ data: Dict[str, Union[str, bool, Dict[str, int], int]] = {
322
334
  "model": model,
323
335
  "hardware": hardware,
324
336
  "autoscaling": {
@@ -333,6 +345,9 @@ class AsyncEndpoints:
333
345
  if display_name is not None:
334
346
  data["display_name"] = display_name
335
347
 
348
+ if inactive_timeout is not None:
349
+ data["inactive_timeout"] = inactive_timeout
350
+
336
351
  response, _, _ = await requestor.arequest(
337
352
  options=TogetherRequest(
338
353
  method="POST",
@@ -399,6 +414,7 @@ class AsyncEndpoints:
399
414
  max_replicas: Optional[int] = None,
400
415
  state: Optional[Literal["STARTED", "STOPPED"]] = None,
401
416
  display_name: Optional[str] = None,
417
+ inactive_timeout: Optional[int] = None,
402
418
  ) -> DedicatedEndpoint:
403
419
  """
404
420
  Update an endpoint's configuration.
@@ -409,6 +425,7 @@ class AsyncEndpoints:
409
425
  max_replicas (int, optional): The maximum number of replicas to scale up to
410
426
  state (str, optional): The desired state of the endpoint ("STARTED" or "STOPPED")
411
427
  display_name (str, optional): A human-readable name for the endpoint
428
+ inactive_timeout (int, optional): The number of minutes of inactivity after which the endpoint will be automatically stopped. Set to 0 to disable automatic timeout.
412
429
 
413
430
  Returns:
414
431
  DedicatedEndpoint: Object containing endpoint information
@@ -417,7 +434,7 @@ class AsyncEndpoints:
417
434
  client=self._client,
418
435
  )
419
436
 
420
- data: Dict[str, Union[str, Dict[str, int]]] = {}
437
+ data: Dict[str, Union[str, Dict[str, int], int]] = {}
421
438
 
422
439
  if min_replicas is not None or max_replicas is not None:
423
440
  current_min = min_replicas
@@ -438,6 +455,9 @@ class AsyncEndpoints:
438
455
  if display_name is not None:
439
456
  data["display_name"] = display_name
440
457
 
458
+ if inactive_timeout is not None:
459
+ data["inactive_timeout"] = inactive_timeout
460
+
441
461
  response, _, _ = await requestor.arequest(
442
462
  options=TogetherRequest(
443
463
  method="PATCH",
@@ -0,0 +1,134 @@
1
+ from __future__ import annotations
2
+
3
+ from typing import List
4
+
5
+ from together.abstract import api_requestor
6
+ from together.together_response import TogetherResponse
7
+ from together.types import (
8
+ ModelObject,
9
+ TogetherClient,
10
+ TogetherRequest,
11
+ )
12
+
13
+
14
class ModelsBase:
    """Shared plumbing for the sync and async model resources."""

    def __init__(self, client: TogetherClient) -> None:
        # Keep a handle on the configured client; requestors are built per call.
        self._client = client

    def _filter_dedicated_models(
        self, models: List[ModelObject], dedicated_response: TogetherResponse
    ) -> List[ModelObject]:
        """
        Keep only the models that appear in the dedicated (autoscale) listing.

        Args:
            models (List[ModelObject]): Full list of models from the API.
            dedicated_response (TogetherResponse): Response from the autoscale
                models endpoint; each entry carries a "name" field.

        Returns:
            List[ModelObject]: The subset of ``models`` deployable as
            dedicated endpoints, in their original order.
        """
        assert isinstance(dedicated_response.data, list)

        # Collect the dedicated model names once so membership checks are O(1).
        available = set()
        for entry in dedicated_response.data:
            available.add(entry["name"])

        # A model's ``id`` matches the ``name`` field in the autoscale response.
        return [candidate for candidate in models if candidate.id in available]
39
+
40
+
41
class Models(ModelsBase):
    def list(
        self,
        dedicated: bool = False,
    ) -> List[ModelObject]:
        """
        Method to return list of models on the API

        Args:
            dedicated (bool, optional): If True, returns only models that can
                be deployed as dedicated endpoints. Defaults to False.

        Returns:
            List[ModelObject]: List of model objects, sorted case-insensitively
            by id.
        """
        requestor = api_requestor.APIRequestor(
            client=self._client,
        )

        response, _, _ = requestor.request(
            options=TogetherRequest(
                method="GET",
                url="models",
            ),
            stream=False,
        )

        assert isinstance(response, TogetherResponse)
        assert isinstance(response.data, list)

        models = [ModelObject(**model) for model in response.data]

        if dedicated:
            # Restrict to models the autoscale service can deploy as
            # dedicated endpoints.
            dedicated_response, _, _ = requestor.request(
                options=TogetherRequest(
                    method="GET",
                    url="autoscale/models",
                ),
                stream=False,
            )

            models = self._filter_dedicated_models(models, dedicated_response)

        # ``model.id`` is treated as Optional elsewhere in this package (the
        # CLI uses ``model.id or ""``), so guard against None before calling
        # .lower() to avoid an AttributeError during sorting.
        models.sort(key=lambda x: (x.id or "").lower())

        return models
87
+
88
+
89
class AsyncModels(ModelsBase):
    async def list(
        self,
        dedicated: bool = False,
    ) -> List[ModelObject]:
        """
        Async method to return list of models on API

        Args:
            dedicated (bool, optional): If True, returns only models that can
                be deployed as dedicated endpoints. Defaults to False.

        Returns:
            List[ModelObject]: List of model objects, sorted case-insensitively
            by id.
        """
        requestor = api_requestor.APIRequestor(
            client=self._client,
        )

        response, _, _ = await requestor.arequest(
            options=TogetherRequest(
                method="GET",
                url="models",
            ),
            stream=False,
        )

        assert isinstance(response, TogetherResponse)
        assert isinstance(response.data, list)

        models = [ModelObject(**model) for model in response.data]

        if dedicated:
            # Restrict to models the autoscale service can deploy as
            # dedicated endpoints.
            dedicated_response, _, _ = await requestor.arequest(
                options=TogetherRequest(
                    method="GET",
                    url="autoscale/models",
                ),
                stream=False,
            )

            models = self._filter_dedicated_models(models, dedicated_response)

        # ``model.id`` is treated as Optional elsewhere in this package (the
        # CLI uses ``model.id or ""``), so guard against None before calling
        # .lower() to avoid an AttributeError during sorting.
        models.sort(key=lambda x: (x.id or "").lower())

        return models
@@ -1,75 +0,0 @@
1
- from __future__ import annotations
2
-
3
- from typing import List
4
-
5
- from together.abstract import api_requestor
6
- from together.together_response import TogetherResponse
7
- from together.types import (
8
- ModelObject,
9
- TogetherClient,
10
- TogetherRequest,
11
- )
12
-
13
-
14
- class Models:
15
- def __init__(self, client: TogetherClient) -> None:
16
- self._client = client
17
-
18
- def list(
19
- self,
20
- ) -> List[ModelObject]:
21
- """
22
- Method to return list of models on the API
23
-
24
- Returns:
25
- List[ModelObject]: List of model objects
26
- """
27
-
28
- requestor = api_requestor.APIRequestor(
29
- client=self._client,
30
- )
31
-
32
- response, _, _ = requestor.request(
33
- options=TogetherRequest(
34
- method="GET",
35
- url="models",
36
- ),
37
- stream=False,
38
- )
39
-
40
- assert isinstance(response, TogetherResponse)
41
- assert isinstance(response.data, list)
42
-
43
- return [ModelObject(**model) for model in response.data]
44
-
45
-
46
- class AsyncModels:
47
- def __init__(self, client: TogetherClient) -> None:
48
- self._client = client
49
-
50
- async def list(
51
- self,
52
- ) -> List[ModelObject]:
53
- """
54
- Async method to return list of models on API
55
-
56
- Returns:
57
- List[ModelObject]: List of model objects
58
- """
59
-
60
- requestor = api_requestor.APIRequestor(
61
- client=self._client,
62
- )
63
-
64
- response, _, _ = await requestor.arequest(
65
- options=TogetherRequest(
66
- method="GET",
67
- url="models",
68
- ),
69
- stream=False,
70
- )
71
-
72
- assert isinstance(response, TogetherResponse)
73
- assert isinstance(response.data, list)
74
-
75
- return [ModelObject(**model) for model in response.data]
File without changes
File without changes
File without changes