PyPI - together - Versions diffs - 1.5.35__py3-none-any.whl → 2.0.0a6__py3-none-any.whl - Mend

together 1.5.35__py3-none-any.whl → 2.0.0a6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (208) hide show

together/__init__.py +101 -114
together/_base_client.py +1995 -0
together/_client.py +1033 -0
together/_compat.py +219 -0
together/_constants.py +14 -0
together/_exceptions.py +108 -0
together/_files.py +123 -0
together/_models.py +857 -0
together/_qs.py +150 -0
together/_resource.py +43 -0
together/_response.py +830 -0
together/_streaming.py +370 -0
together/_types.py +260 -0
together/_utils/__init__.py +64 -0
together/_utils/_compat.py +45 -0
together/_utils/_datetime_parse.py +136 -0
together/_utils/_logs.py +25 -0
together/_utils/_proxy.py +65 -0
together/_utils/_reflection.py +42 -0
together/_utils/_resources_proxy.py +24 -0
together/_utils/_streams.py +12 -0
together/_utils/_sync.py +58 -0
together/_utils/_transform.py +457 -0
together/_utils/_typing.py +156 -0
together/_utils/_utils.py +421 -0
together/_version.py +4 -0
together/lib/.keep +4 -0
together/lib/__init__.py +23 -0
together/{cli → lib/cli}/api/endpoints.py +66 -84
together/{cli/api/evaluation.py → lib/cli/api/evals.py} +152 -43
together/{cli → lib/cli}/api/files.py +20 -17
together/{cli/api/finetune.py → lib/cli/api/fine_tuning.py} +116 -172
together/{cli → lib/cli}/api/models.py +34 -27
together/lib/cli/api/utils.py +50 -0
together/{cli → lib/cli}/cli.py +16 -26
together/{constants.py → lib/constants.py} +11 -24
together/lib/resources/__init__.py +11 -0
together/lib/resources/files.py +999 -0
together/lib/resources/fine_tuning.py +280 -0
together/lib/resources/models.py +35 -0
together/lib/types/__init__.py +13 -0
together/lib/types/error.py +9 -0
together/lib/types/fine_tuning.py +397 -0
together/{utils → lib/utils}/__init__.py +6 -14
together/{utils → lib/utils}/_log.py +11 -16
together/{utils → lib/utils}/files.py +90 -288
together/lib/utils/serializer.py +10 -0
together/{utils → lib/utils}/tools.py +19 -55
together/resources/__init__.py +225 -39
together/resources/audio/__init__.py +72 -48
together/resources/audio/audio.py +198 -0
together/resources/audio/speech.py +574 -128
together/resources/audio/transcriptions.py +247 -261
together/resources/audio/translations.py +221 -241
together/resources/audio/voices.py +111 -41
together/resources/batches.py +417 -0
together/resources/chat/__init__.py +30 -21
together/resources/chat/chat.py +102 -0
together/resources/chat/completions.py +1063 -263
together/resources/code_interpreter/__init__.py +33 -0
together/resources/code_interpreter/code_interpreter.py +258 -0
together/resources/code_interpreter/sessions.py +135 -0
together/resources/completions.py +884 -225
together/resources/embeddings.py +172 -68
together/resources/endpoints.py +589 -490
together/resources/evals.py +452 -0
together/resources/files.py +397 -129
together/resources/fine_tuning.py +1033 -0
together/resources/hardware.py +181 -0
together/resources/images.py +258 -104
together/resources/jobs.py +214 -0
together/resources/models.py +223 -193
together/resources/rerank.py +190 -92
together/resources/videos.py +286 -214
together/types/__init__.py +66 -167
together/types/audio/__init__.py +10 -0
together/types/audio/speech_create_params.py +75 -0
together/types/audio/transcription_create_params.py +54 -0
together/types/audio/transcription_create_response.py +111 -0
together/types/audio/translation_create_params.py +40 -0
together/types/audio/translation_create_response.py +70 -0
together/types/audio/voice_list_response.py +23 -0
together/types/audio_speech_stream_chunk.py +16 -0
together/types/autoscaling.py +13 -0
together/types/autoscaling_param.py +15 -0
together/types/batch_create_params.py +24 -0
together/types/batch_create_response.py +14 -0
together/types/batch_job.py +45 -0
together/types/batch_list_response.py +10 -0
together/types/chat/__init__.py +18 -0
together/types/chat/chat_completion.py +60 -0
together/types/chat/chat_completion_chunk.py +61 -0
together/types/chat/chat_completion_structured_message_image_url_param.py +18 -0
together/types/chat/chat_completion_structured_message_text_param.py +13 -0
together/types/chat/chat_completion_structured_message_video_url_param.py +18 -0
together/types/chat/chat_completion_usage.py +13 -0
together/types/chat/chat_completion_warning.py +9 -0
together/types/chat/completion_create_params.py +329 -0
together/types/code_interpreter/__init__.py +5 -0
together/types/code_interpreter/session_list_response.py +31 -0
together/types/code_interpreter_execute_params.py +45 -0
together/types/completion.py +42 -0
together/types/completion_chunk.py +66 -0
together/types/completion_create_params.py +138 -0
together/types/dedicated_endpoint.py +44 -0
together/types/embedding.py +24 -0
together/types/embedding_create_params.py +31 -0
together/types/endpoint_create_params.py +43 -0
together/types/endpoint_list_avzones_response.py +11 -0
together/types/endpoint_list_params.py +18 -0
together/types/endpoint_list_response.py +41 -0
together/types/endpoint_update_params.py +27 -0
together/types/eval_create_params.py +263 -0
together/types/eval_create_response.py +16 -0
together/types/eval_list_params.py +21 -0
together/types/eval_list_response.py +10 -0
together/types/eval_status_response.py +100 -0
together/types/evaluation_job.py +139 -0
together/types/execute_response.py +108 -0
together/types/file_delete_response.py +13 -0
together/types/file_list.py +12 -0
together/types/file_purpose.py +9 -0
together/types/file_response.py +31 -0
together/types/file_type.py +7 -0
together/types/fine_tuning_cancel_response.py +194 -0
together/types/fine_tuning_content_params.py +24 -0
together/types/fine_tuning_delete_params.py +11 -0
together/types/fine_tuning_delete_response.py +12 -0
together/types/fine_tuning_list_checkpoints_response.py +21 -0
together/types/fine_tuning_list_events_response.py +12 -0
together/types/fine_tuning_list_response.py +199 -0
together/types/finetune_event.py +41 -0
together/types/finetune_event_type.py +33 -0
together/types/finetune_response.py +177 -0
together/types/hardware_list_params.py +16 -0
together/types/hardware_list_response.py +58 -0
together/types/image_data_b64.py +15 -0
together/types/image_data_url.py +15 -0
together/types/image_file.py +23 -0
together/types/image_generate_params.py +85 -0
together/types/job_list_response.py +47 -0
together/types/job_retrieve_response.py +43 -0
together/types/log_probs.py +18 -0
together/types/model_list_response.py +10 -0
together/types/model_object.py +42 -0
together/types/model_upload_params.py +36 -0
together/types/model_upload_response.py +23 -0
together/types/rerank_create_params.py +36 -0
together/types/rerank_create_response.py +36 -0
together/types/tool_choice.py +23 -0
together/types/tool_choice_param.py +23 -0
together/types/tools_param.py +23 -0
together/types/training_method_dpo.py +22 -0
together/types/training_method_sft.py +18 -0
together/types/video_create_params.py +86 -0
together/types/video_create_response.py +10 -0
together/types/video_job.py +57 -0
together-2.0.0a6.dist-info/METADATA +729 -0
together-2.0.0a6.dist-info/RECORD +165 -0
{together-1.5.35.dist-info → together-2.0.0a6.dist-info}/WHEEL +1 -1
together-2.0.0a6.dist-info/entry_points.txt +2 -0
{together-1.5.35.dist-info → together-2.0.0a6.dist-info}/licenses/LICENSE +1 -1
together/abstract/api_requestor.py +0 -770
together/cli/api/chat.py +0 -298
together/cli/api/completions.py +0 -119
together/cli/api/images.py +0 -93
together/cli/api/utils.py +0 -139
together/client.py +0 -186
together/error.py +0 -194
together/filemanager.py +0 -635
together/legacy/__init__.py +0 -0
together/legacy/base.py +0 -27
together/legacy/complete.py +0 -93
together/legacy/embeddings.py +0 -27
together/legacy/files.py +0 -146
together/legacy/finetune.py +0 -177
together/legacy/images.py +0 -27
together/legacy/models.py +0 -44
together/resources/batch.py +0 -165
together/resources/code_interpreter.py +0 -82
together/resources/evaluation.py +0 -808
together/resources/finetune.py +0 -1388
together/together_response.py +0 -50
together/types/abstract.py +0 -26
together/types/audio_speech.py +0 -311
together/types/batch.py +0 -54
together/types/chat_completions.py +0 -210
together/types/code_interpreter.py +0 -57
together/types/common.py +0 -67
together/types/completions.py +0 -107
together/types/embeddings.py +0 -35
together/types/endpoints.py +0 -123
together/types/error.py +0 -16
together/types/evaluation.py +0 -93
together/types/files.py +0 -93
together/types/finetune.py +0 -465
together/types/images.py +0 -42
together/types/models.py +0 -96
together/types/rerank.py +0 -43
together/types/videos.py +0 -69
together/utils/api_helpers.py +0 -124
together/version.py +0 -6
together-1.5.35.dist-info/METADATA +0 -583
together-1.5.35.dist-info/RECORD +0 -77
together-1.5.35.dist-info/entry_points.txt +0 -3
/together/{abstract → lib/cli}/__init__.py +0 -0
/together/{cli → lib/cli/api}/__init__.py +0 -0
/together/{cli/api/__init__.py → py.typed} +0 -0

together/{cli → lib/cli}/api/endpoints.py RENAMED Viewed

@@ -1,34 +1,30 @@
 from __future__ import annotations
-import json
 import sys
+import json
+from typing import Any, Dict, Literal, TypeVar, Callable, cast
 from functools import wraps
-from typing import Any, Callable, Dict, List, Literal, TypeVar, Union
 import click
-from together import Together
-from together.error import InvalidRequestError
-from together.types import DedicatedEndpoint, ListEndpoint
+from together import Together, omit
+from together.types import DedicatedEndpoint
+from together._exceptions import APIError
+from together.lib.utils.serializer import datetime_serializer
+from together.types.endpoint_list_response import Data as DedicatedEndpointListItem
-def print_endpoint(
-    endpoint: Union[DedicatedEndpoint, ListEndpoint],
-) -> None:
+def print_endpoint(endpoint: DedicatedEndpoint | DedicatedEndpointListItem) -> None:
     """Print endpoint details in a Docker-like format or JSON."""
     # Print header info
     click.echo(f"ID:\t\t{endpoint.id}")
     click.echo(f"Name:\t\t{endpoint.name}")
-    # Print type-specific fields
     if isinstance(endpoint, DedicatedEndpoint):
         click.echo(f"Display Name:\t{endpoint.display_name}")
         click.echo(f"Hardware:\t{endpoint.hardware}")
-        click.echo(
-            f"Autoscaling:\tMin={endpoint.autoscaling.min_replicas}, "
-            f"Max={endpoint.autoscaling.max_replicas}"
-        )
+        click.echo(f"Autoscaling:\tMin={endpoint.autoscaling.min_replicas}, Max={endpoint.autoscaling.max_replicas}")
     click.echo(f"Model:\t\t{endpoint.model}")
     click.echo(f"Type:\t\t{endpoint.type}")
@@ -40,15 +36,10 @@ def print_endpoint(
 F = TypeVar("F", bound=Callable[..., Any])
-def print_api_error(
-    e: InvalidRequestError,
-) -> None:
-    error_details = e.api_response.message
+def print_api_error(e: APIError) -> None:
+    error_details = cast(Dict[str, Any], e.body)["error"]["message"]
-    if error_details and (
-        "credentials" in error_details.lower()
-        or "authentication" in error_details.lower()
-    ):
+    if error_details and ("credentials" in error_details.lower() or "authentication" in error_details.lower()):
         click.echo("Error: Invalid API key or authentication failed", err=True)
     else:
         click.echo(f"Error: {error_details}", err=True)
@@ -61,7 +52,7 @@ def handle_api_errors(f: F) -> F:
     def wrapper(*args: Any, **kwargs: Any) -> Any:
         try:
             return f(*args, **kwargs)
-        except InvalidRequestError as e:
+        except APIError as e:
             print_api_error(e)
             sys.exit(1)
         except Exception as e:
@@ -98,7 +89,7 @@ def endpoints(ctx: click.Context) -> None:
 )
 @click.option(
     "--gpu",
-    type=click.Choice(["b200", "h200", "h100", "a100", "l40", "l40s", "rtx-6000"]),
+    type=click.Choice(["h100", "a100", "l40", "l40s", "rtx-6000"]),
     required=True,
     help="GPU type to use for inference",
 )
@@ -137,7 +128,8 @@ def endpoints(ctx: click.Context) -> None:
     help="Start endpoint in specified availability zone (e.g., us-central-4b)",
 )
 @click.option(
-    "--wait/--no-wait",
+    "--wait",
+    is_flag=True,
     default=True,
     help="Wait for the endpoint to be ready after creation",
 )
@@ -151,8 +143,8 @@ def create(
     gpu: str,
     gpu_count: int,
     display_name: str | None,
-    no_prompt_cache: bool,
-    no_speculative_decoding: bool,
+    no_prompt_cache: bool | None,
+    no_speculative_decoding: bool | None,
     no_auto_start: bool,
     inactive_timeout: int | None,
     availability_zone: str | None,
@@ -161,8 +153,6 @@ def create(
     """Create a new dedicated inference endpoint."""
     # Map GPU types to their full hardware ID names
     gpu_map = {
-        "b200": "nvidia_b200_180gb_sxm",
-        "h200": "nvidia_h200_140gb_sxm",
         "h100": "nvidia_h100_80gb_sxm",
         "a100": "nvidia_a100_80gb_pcie" if gpu_count == 1 else "nvidia_a100_80gb_sxm",
         "l40": "nvidia_l40",
@@ -176,21 +166,21 @@ def create(
         response = client.endpoints.create(
             model=model,
             hardware=hardware_id,
-            min_replicas=min_replicas,
-            max_replicas=max_replicas,
-            display_name=display_name,
-            disable_prompt_cache=no_prompt_cache,
-            disable_speculative_decoding=no_speculative_decoding,
+            autoscaling={
+                "min_replicas": min_replicas,
+                "max_replicas": max_replicas,
+            },
+            display_name=display_name or omit,
+            disable_prompt_cache=no_prompt_cache or omit,
+            disable_speculative_decoding=no_speculative_decoding or omit,
             state="STOPPED" if no_auto_start else "STARTED",
             inactive_timeout=inactive_timeout,
-            availability_zone=availability_zone,
+            extra_query={"availability_zone": availability_zone or omit},
         )
-    except InvalidRequestError as e:
+    except APIError as e:
         print_api_error(e)
-        if "check the hardware api" in str(e).lower():
-            fetch_and_print_hardware_options(
-                client=client, model=model, print_json=False, available=True
-            )
+        if "check the hardware api" in str(e.args[0]).lower() or "invalid hardware provided" in str(e.args[0]).lower():
+            fetch_and_print_hardware_options(client=client, model=model, print_json=False, available=True)
         sys.exit(1)
@@ -219,7 +209,7 @@ def create(
         import time
         click.echo("Waiting for endpoint to be ready...", err=True)
-        while client.endpoints.get(response.id).state != "STARTED":
+        while client.endpoints.retrieve(response.id).state != "STARTED":
             time.sleep(1)
         click.echo("Endpoint ready", err=True)
@@ -234,11 +224,11 @@ def create(
 @handle_api_errors
 def get(client: Together, endpoint_id: str, json: bool) -> None:
     """Get a dedicated inference endpoint."""
-    endpoint = client.endpoints.get(endpoint_id)
+    endpoint = client.endpoints.retrieve(endpoint_id)
     if json:
         import json as json_lib
-        click.echo(json_lib.dumps(endpoint.model_dump(), indent=2))
+        click.echo(json_lib.dumps(endpoint.model_dump(), indent=2, default=datetime_serializer))
     else:
         print_endpoint(endpoint)
@@ -258,37 +248,31 @@ def hardware(client: Together, model: str | None, json: bool, available: bool) -
     fetch_and_print_hardware_options(client, model, json, available)
-def fetch_and_print_hardware_options(
-    client: Together, model: str | None, print_json: bool, available: bool
-) -> None:
+def fetch_and_print_hardware_options(client: Together, model: str | None, print_json: bool, available: bool) -> None:
     """Print hardware options for a model."""
     message = "Available hardware options:" if available else "All hardware options:"
     click.echo(message, err=True)
-    hardware_options = client.endpoints.list_hardware(model)
+    hardware_options = client.hardware.list(model=model or omit)
+    # hardware_options = client.endpoints.list_hardware(model)
     if available:
-        hardware_options = [
+        hardware_options.data = [
             hardware
-            for hardware in hardware_options
-            if hardware.availability is not None
-            and hardware.availability.status == "available"
+            for hardware in hardware_options.data
+            if hardware.availability is not None and hardware.availability.status == "available"
         ]
     if print_json:
-        json_output = [hardware.model_dump() for hardware in hardware_options]
-        click.echo(json.dumps(json_output, indent=2))
+        json_output = [hardware.model_dump() for hardware in hardware_options.data]
+        click.echo(json.dumps(json_output, default=datetime_serializer, indent=2))
     else:
-        for hardware in hardware_options:
+        for hardware in hardware_options.data:
             click.echo(f"  {hardware.id}", err=True)
 @endpoints.command()
 @click.argument("endpoint-id", required=True)
-@click.option(
-    "--wait/--no-wait",
-    default=True,
-    help="Wait for the endpoint to stop",
-)
+@click.option("--wait", is_flag=True, default=True, help="Wait for the endpoint to stop")
 @click.pass_obj
 @handle_api_errors
 def stop(client: Together, endpoint_id: str, wait: bool) -> None:
@@ -300,7 +284,7 @@ def stop(client: Together, endpoint_id: str, wait: bool) -> None:
         import time
         click.echo("Waiting for endpoint to stop...", err=True)
-        while client.endpoints.get(endpoint_id).state != "STOPPED":
+        while client.endpoints.retrieve(endpoint_id).state != "STOPPED":
             time.sleep(1)
         click.echo("Endpoint stopped", err=True)
@@ -309,11 +293,7 @@ def stop(client: Together, endpoint_id: str, wait: bool) -> None:
 @endpoints.command()
 @click.argument("endpoint-id", required=True)
-@click.option(
-    "--wait/--no-wait",
-    default=True,
-    help="Wait for the endpoint to start",
-)
+@click.option("--wait", is_flag=True, default=True, help="Wait for the endpoint to start")
 @click.pass_obj
 @handle_api_errors
 def start(client: Together, endpoint_id: str, wait: bool) -> None:
@@ -325,7 +305,7 @@ def start(client: Together, endpoint_id: str, wait: bool) -> None:
         import time
         click.echo("Waiting for endpoint to start...", err=True)
-        while client.endpoints.get(endpoint_id).state != "STARTED":
+        while client.endpoints.retrieve(endpoint_id).state != "STARTED":
             time.sleep(1)
         click.echo("Endpoint started", err=True)
@@ -371,8 +351,10 @@ def list(
     mine: bool | None,
 ) -> None:
     """List all inference endpoints (includes both dedicated and serverless endpoints)."""
-    endpoints: List[ListEndpoint] = client.endpoints.list(
-        type=type, usage_type=usage_type, mine=mine
+    endpoints = client.endpoints.list(
+        type=type or omit,
+        usage_type=usage_type or omit,
+        mine=mine if mine is not None else omit,
     )
     if not endpoints:
@@ -384,10 +366,12 @@ def list(
         import json as json_lib
         click.echo(
-            json_lib.dumps([endpoint.model_dump() for endpoint in endpoints], indent=2)
+            json_lib.dumps(
+                [endpoint.model_dump() for endpoint in endpoints.data], default=datetime_serializer, indent=2
+            )
         )
     else:
-        for endpoint in endpoints:
+        for endpoint in endpoints.data:
             print_endpoint(
                 endpoint,
             )
@@ -430,32 +414,30 @@ def update(
         click.echo("Error: At least one update option must be specified", err=True)
         sys.exit(1)
-    # If only one of min/max replicas is specified, we need both for the update
-    if (min_replicas is None) != (max_replicas is None):
-        click.echo(
-            "Error: Both --min-replicas and --max-replicas must be specified together",
-            err=True,
-        )
-        sys.exit(1)
     # Build kwargs for the update
     kwargs: Dict[str, Any] = {}
     if display_name is not None:
         kwargs["display_name"] = display_name
-    if min_replicas is not None and max_replicas is not None:
-        kwargs["min_replicas"] = min_replicas
-        kwargs["max_replicas"] = max_replicas
+    if min_replicas is not None or max_replicas is not None:
+        kwargs["autoscaling"] = {}
+        if min_replicas is not None:
+            kwargs["autoscaling"]["min_replicas"] = min_replicas
+        if max_replicas is not None:
+            kwargs["autoscaling"]["max_replicas"] = max_replicas
     if inactive_timeout is not None:
         kwargs["inactive_timeout"] = inactive_timeout
-    _response = client.endpoints.update(endpoint_id, **kwargs)
+    client.endpoints.update(endpoint_id, **kwargs)
     # Print what was updated
     click.echo("Updated endpoint configuration:", err=True)
     if display_name:
         click.echo(f"  Display name: {display_name}", err=True)
-    if min_replicas is not None and max_replicas is not None:
+    if min_replicas:
         click.echo(f"  Min replicas: {min_replicas}", err=True)
+    if max_replicas:
         click.echo(f"  Max replicas: {max_replicas}", err=True)
     if inactive_timeout is not None:
         click.echo(f"  Inactive timeout: {inactive_timeout} minutes", err=True)
@@ -479,8 +461,8 @@ def availability_zones(client: Together, json: bool) -> None:
     if json:
         import json as json_lib
-        click.echo(json_lib.dumps({"avzones": avzones}, indent=2))
+        click.echo(json_lib.dumps(avzones.model_dump(), indent=2))
     else:
         click.echo("Available zones:", err=True)
-        for availability_zone in sorted(avzones):
+        for availability_zone in sorted(avzones.avzones):
             click.echo(f"  {availability_zone}")

together/{cli/api/evaluation.py → lib/cli/api/evals.py} RENAMED Viewed

@@ -1,21 +1,72 @@
+import sys
 import json
-from typing import Optional, Dict, Union, Any
+from typing import Any, Dict, List, Union, Literal, TypeVar, Callable, Optional, cast
+from functools import wraps
 import click
 from tabulate import tabulate
-from together import Together
-from together.utils import convert_unix_timestamp
+from together import APIError, Together, TogetherError
+from together._types import omit
+from together.lib.utils.serializer import datetime_serializer
+from together.types.eval_create_params import (
+    ParametersEvaluationScoreParameters,
+    ParametersEvaluationCompareParameters,
+    ParametersEvaluationClassifyParameters,
+    ParametersEvaluationScoreParametersJudge,
+    ParametersEvaluationCompareParametersJudge,
+    ParametersEvaluationClassifyParametersJudge,
+    ParametersEvaluationScoreParametersModelToEvaluate,
+    ParametersEvaluationClassifyParametersModelToEvaluate,
+    ParametersEvaluationCompareParametersModelAEvaluationModelRequest,
+    ParametersEvaluationCompareParametersModelBEvaluationModelRequest,
+)
+def print_api_error(e: Union[APIError, TogetherError]) -> None:
+    if isinstance(e, APIError):
+        error_details = cast(Dict[str, Any], e.body)["error"]["message"]
+        if error_details and ("credentials" in error_details.lower() or "authentication" in error_details.lower()):
+            click.echo("Error: Invalid API key or authentication failed", err=True)
+        else:
+            click.echo(f"Error: {error_details}", err=True)
+    click.echo(f"Error: {e}", err=True)
+    return
+F = TypeVar("F", bound=Callable[..., Any])
+def handle_api_errors(f: F) -> F:
+    """Decorator to handle common API errors in CLI commands."""
+    @wraps(f)
+    def wrapper(*args: Any, **kwargs: Any) -> Any:
+        try:
+            return f(*args, **kwargs)
+        except APIError as e:
+            print_api_error(e)
+            sys.exit(1)
+        except TogetherError as e:
+            print_api_error(e)
+            sys.exit(1)
+        except Exception as e:
+            click.echo(f"Error: An unexpected error occurred - {str(e)}", err=True)
+            sys.exit(1)
+    return wrapper  # type: ignore
 @click.group()
 @click.pass_context
-def evaluation(ctx: click.Context) -> None:
-    """Evaluation API commands"""
+def evals(ctx: click.Context) -> None:
+    """Evals API commands"""
     pass
-@evaluation.command()
+@evals.command()
 @click.pass_context
 @click.option(
     "--type",
@@ -222,11 +273,12 @@ def evaluation(ctx: click.Context) -> None:
     type=str,
     help="Input template for model B.",
 )
+@handle_api_errors
 def create(
     ctx: click.Context,
-    type: str,
+    type: Literal["classify", "score", "compare"],
     judge_model: str,
-    judge_model_source: str,
+    judge_model_source: Literal["serverless", "dedicated", "external"],
     judge_system_template: str,
     judge_external_api_token: Optional[str],
     judge_external_base_url: Optional[str],
@@ -307,13 +359,9 @@ def create(
             "input_template": model_to_evaluate_input_template,
         }
         if model_to_evaluate_external_api_token:
-            model_to_evaluate_final["external_api_token"] = (
-                model_to_evaluate_external_api_token
-            )
+            model_to_evaluate_final["external_api_token"] = model_to_evaluate_external_api_token
         if model_to_evaluate_external_base_url:
-            model_to_evaluate_final["external_base_url"] = (
-                model_to_evaluate_external_base_url
-            )
+            model_to_evaluate_final["external_base_url"] = model_to_evaluate_external_base_url
     # Build model-a configuration
     model_a_final: Union[Dict[str, Any], None, str] = None
@@ -385,35 +433,55 @@ def create(
         if model_b_external_base_url:
             model_b_final["external_base_url"] = model_b_external_base_url
-    try:
-        response = client.evaluation.create(
+    judge_config = _build_judge(
+        type, judge_model, judge_model_source, judge_system_template, judge_external_api_token, judge_external_base_url
+    )
+    if type == "classify":
+        response = client.evals.create(
+            type=type,
+            parameters=ParametersEvaluationClassifyParameters(
+                input_data_file_path=input_data_file_path,
+                judge=judge_config,
+                labels=labels_list or [],
+                pass_labels=pass_labels_list or [],
+                model_to_evaluate=cast(ParametersEvaluationClassifyParametersModelToEvaluate, model_to_evaluate_final),
+            ),
+        )
+    elif type == "score":
+        if max_score is None or min_score is None or pass_threshold is None:
+            raise TogetherError("max_score, min_score, and pass_threshold are required for score type")
+        response = client.evals.create(
+            type="score",
+            parameters=ParametersEvaluationScoreParameters(
+                input_data_file_path=input_data_file_path,
+                judge=judge_config,
+                max_score=max_score,
+                min_score=min_score,
+                pass_threshold=pass_threshold,
+                model_to_evaluate=cast(ParametersEvaluationScoreParametersModelToEvaluate, model_to_evaluate_final),
+            ),
+        )
+    elif type == "compare":
+        response = client.evals.create(
             type=type,
-            judge_model=judge_model,
-            judge_model_source=judge_model_source,
-            judge_system_template=judge_system_template,
-            judge_external_api_token=judge_external_api_token,
-            judge_external_base_url=judge_external_base_url,
-            input_data_file_path=input_data_file_path,
-            model_to_evaluate=model_to_evaluate_final,
-            labels=labels_list,
-            pass_labels=pass_labels_list,
-            min_score=min_score,
-            max_score=max_score,
-            pass_threshold=pass_threshold,
-            model_a=model_a_final,
-            model_b=model_b_final,
+            parameters=ParametersEvaluationCompareParameters(
+                input_data_file_path=input_data_file_path,
+                judge=judge_config,
+                model_a=cast(ParametersEvaluationCompareParametersModelAEvaluationModelRequest, model_a_final),
+                model_b=cast(ParametersEvaluationCompareParametersModelBEvaluationModelRequest, model_b_final),
+            ),
         )
-    except ValueError as e:
-        raise click.BadParameter(str(e))
     click.echo(json.dumps(response.model_dump(exclude_none=True), indent=4))
-@evaluation.command()
+@evals.command()
 @click.pass_context
 @click.option(
     "--status",
-    type=str,
+    type=click.Choice(["pending", "queued", "running", "completed", "error", "user_error"]),
     help="Filter by job status.",
 )
 @click.option(
@@ -421,14 +489,18 @@ def create(
     type=int,
     help="Limit number of results (max 100).",
 )
-def list(ctx: click.Context, status: Optional[str], limit: Optional[int]) -> None:
-    """List evaluation jobs"""
+def list(
+    ctx: click.Context,
+    status: Union[Literal["pending", "queued", "running", "completed", "error", "user_error"], None],
+    limit: Union[int, None],
+) -> None:
+    """List evals"""
     client: Together = ctx.obj
-    response = client.evaluation.list(status=status, limit=limit)
+    response = client.evals.list(status=status or omit, limit=limit or omit)
-    display_list = []
+    display_list: List[Dict[str, Any]] = []
     for job in response:
         if job.parameters:
             model = job.parameters.get("model_to_evaluate", "")
@@ -436,6 +508,8 @@ def list(ctx: click.Context, status: Optional[str], limit: Optional[int]) -> Non
             model_b = job.parameters.get("model_b", "")
         else:
             model = ""
+            model_a = ""
+            model_b = ""
         display_list.append(
             {
@@ -453,7 +527,7 @@ def list(ctx: click.Context, status: Optional[str], limit: Optional[int]) -> Non
     click.echo(table)
-@evaluation.command()
+@evals.command()
 @click.pass_context
 @click.argument("evaluation_id", type=str, required=True)
 def retrieve(ctx: click.Context, evaluation_id: str) -> None:
@@ -461,12 +535,12 @@ def retrieve(ctx: click.Context, evaluation_id: str) -> None:
     client: Together = ctx.obj
-    response = client.evaluation.retrieve(evaluation_id=evaluation_id)
+    response = client.evals.retrieve(evaluation_id)
-    click.echo(json.dumps(response.model_dump(exclude_none=True), indent=4))
+    click.echo(json.dumps(response.model_dump(exclude_none=True), default=datetime_serializer, indent=4))
-@evaluation.command()
+@evals.command()
 @click.pass_context
 @click.argument("evaluation_id", type=str, required=True)
 def status(ctx: click.Context, evaluation_id: str) -> None:
@@ -474,6 +548,41 @@ def status(ctx: click.Context, evaluation_id: str) -> None:
     client: Together = ctx.obj
-    response = client.evaluation.status(evaluation_id=evaluation_id)
+    response = client.evals.status(evaluation_id)
     click.echo(json.dumps(response.model_dump(exclude_none=True), indent=4))
+def _build_judge(
+    type: Literal["classify", "score", "compare"],
+    judge_model: str,
+    judge_model_source: Literal["serverless", "dedicated", "external"],
+    judge_system_template: str,
+    judge_external_api_token: Optional[str],
+    judge_external_base_url: Optional[str],
+) -> ParametersEvaluationClassifyParametersJudge:
+    if type == "classify":
+        judge_config = ParametersEvaluationClassifyParametersJudge(
+            model=judge_model,
+            model_source=judge_model_source,
+            system_template=judge_system_template,
+        )
+    elif type == "score":
+        judge_config = ParametersEvaluationScoreParametersJudge(
+            model=judge_model,
+            model_source=judge_model_source,
+            system_template=judge_system_template,
+        )
+    elif type == "compare":
+        judge_config = ParametersEvaluationCompareParametersJudge(
+            model=judge_model,
+            model_source=judge_model_source,
+            system_template=judge_system_template,
+        )
+    if judge_external_api_token:
+        judge_config["external_api_token"] = judge_external_api_token
+    if judge_external_base_url:
+        judge_config["external_base_url"] = judge_external_base_url
+    return judge_config

together 1.5.35__py3-none-any.whl → 2.0.0a6__py3-none-any.whl

together 1.5.35__py3-none-any.whl → 2.0.0a6__py3-none-any.whl