together-2.0.0a8-py3-none-any.whl → together-2.0.0a10-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (36)
  1. together/_streaming.py +50 -48
  2. together/_types.py +3 -2
  3. together/_utils/_utils.py +1 -1
  4. together/_version.py +1 -1
  5. together/lib/cli/api/fine_tuning.py +65 -3
  6. together/lib/cli/api/models.py +1 -6
  7. together/lib/resources/fine_tuning.py +41 -2
  8. together/resources/audio/transcriptions.py +20 -0
  9. together/resources/chat/completions.py +48 -0
  10. together/resources/fine_tuning.py +213 -5
  11. together/resources/images.py +13 -1
  12. together/resources/models.py +41 -5
  13. together/types/__init__.py +3 -0
  14. together/types/audio/transcription_create_params.py +14 -0
  15. together/types/audio/voice_list_response.py +4 -0
  16. together/types/autoscaling.py +2 -0
  17. together/types/autoscaling_param.py +2 -0
  18. together/types/chat/completion_create_params.py +78 -5
  19. together/types/dedicated_endpoint.py +2 -0
  20. together/types/endpoint_list_avzones_response.py +2 -0
  21. together/types/endpoint_list_response.py +2 -0
  22. together/types/execute_response.py +7 -0
  23. together/types/fine_tuning_cancel_response.py +6 -0
  24. together/types/fine_tuning_estimate_price_params.py +98 -0
  25. together/types/fine_tuning_estimate_price_response.py +24 -0
  26. together/types/fine_tuning_list_response.py +6 -0
  27. together/types/hardware_list_response.py +8 -0
  28. together/types/image_generate_params.py +9 -0
  29. together/types/model_list_params.py +12 -0
  30. together/types/video_job.py +8 -0
  31. {together-2.0.0a8.dist-info → together-2.0.0a10.dist-info}/METADATA +11 -12
  32. {together-2.0.0a8.dist-info → together-2.0.0a10.dist-info}/RECORD +35 -33
  33. together/lib/resources/models.py +0 -35
  34. {together-2.0.0a8.dist-info → together-2.0.0a10.dist-info}/WHEEL +0 -0
  35. {together-2.0.0a8.dist-info → together-2.0.0a10.dist-info}/entry_points.txt +0 -0
  36. {together-2.0.0a8.dist-info → together-2.0.0a10.dist-info}/licenses/LICENSE +0 -0
@@ -7,7 +7,7 @@ from typing_extensions import Literal
7
7
  import httpx
8
8
  from rich import print as rprint
9
9
 
10
- from ..types import fine_tuning_delete_params, fine_tuning_content_params
10
+ from ..types import fine_tuning_delete_params, fine_tuning_content_params, fine_tuning_estimate_price_params
11
11
  from .._types import Body, Omit, Query, Headers, NotGiven, omit, not_given
12
12
  from .._utils import maybe_transform, async_maybe_transform
13
13
  from .._compat import cached_property
@@ -27,17 +27,31 @@ from .._response import (
27
27
  async_to_custom_streamed_response_wrapper,
28
28
  )
29
29
  from .._base_client import make_request_options
30
- from ..lib.types.fine_tuning import FinetuneResponse as FinetuneResponseLib, FinetuneTrainingLimits
30
+ from ..lib.types.fine_tuning import (
31
+ FinetuneResponse as FinetuneResponseLib,
32
+ FinetuneTrainingLimits,
33
+ )
31
34
  from ..types.finetune_response import FinetuneResponse
32
- from ..lib.resources.fine_tuning import get_model_limits, async_get_model_limits, create_finetune_request
35
+ from ..lib.resources.fine_tuning import (
36
+ get_model_limits,
37
+ async_get_model_limits,
38
+ create_finetune_request,
39
+ )
33
40
  from ..types.fine_tuning_list_response import FineTuningListResponse
34
41
  from ..types.fine_tuning_cancel_response import FineTuningCancelResponse
35
42
  from ..types.fine_tuning_delete_response import FineTuningDeleteResponse
36
43
  from ..types.fine_tuning_list_events_response import FineTuningListEventsResponse
44
+ from ..types.fine_tuning_estimate_price_response import FineTuningEstimatePriceResponse
37
45
  from ..types.fine_tuning_list_checkpoints_response import FineTuningListCheckpointsResponse
38
46
 
39
47
  __all__ = ["FineTuningResource", "AsyncFineTuningResource"]
40
48
 
49
+ _WARNING_MESSAGE_INSUFFICIENT_FUNDS = (
50
+ "The estimated price of the fine-tuning job is {} which is significantly "
51
+ "greater than your current credit limit and balance combined. "
52
+ "It will likely get cancelled due to insufficient funds. "
53
+ "Proceed at your own risk."
54
+ )
41
55
 
42
56
  class FineTuningResource(SyncAPIResource):
43
57
  @cached_property
@@ -179,7 +193,7 @@ class FineTuningResource(SyncAPIResource):
179
193
  pass
180
194
  model_limits = get_model_limits(self._client, str(model_name))
181
195
 
182
- finetune_request = create_finetune_request(
196
+ finetune_request, training_type_cls, training_method_cls = create_finetune_request(
183
197
  model_limits=model_limits,
184
198
  training_file=training_file,
185
199
  model=model,
@@ -218,11 +232,32 @@ class FineTuningResource(SyncAPIResource):
218
232
  hf_output_repo_name=hf_output_repo_name,
219
233
  )
220
234
 
235
+
236
+ price_estimation_result = self.estimate_price(
237
+ training_file=training_file,
238
+ from_checkpoint=from_checkpoint or Omit(),
239
+ validation_file=validation_file or Omit(),
240
+ model=model or "",
241
+ n_epochs=finetune_request.n_epochs,
242
+ n_evals=finetune_request.n_evals or 0,
243
+ training_type=training_type_cls,
244
+ training_method=training_method_cls,
245
+ )
246
+
247
+
221
248
  if verbose:
222
249
  rprint(
223
250
  "Submitting a fine-tuning job with the following parameters:",
224
251
  finetune_request,
225
252
  )
253
+ if not price_estimation_result.allowed_to_proceed:
254
+ rprint(
255
+ "[red]"
256
+ + _WARNING_MESSAGE_INSUFFICIENT_FUNDS.format(
257
+ price_estimation_result.estimated_total_price # pyright: ignore[reportPossiblyUnboundVariable]
258
+ )
259
+ + "[/red]",
260
+ )
226
261
  parameter_payload = finetune_request.model_dump(exclude_none=True)
227
262
 
228
263
  return self._client.post(
@@ -413,6 +448,76 @@ class FineTuningResource(SyncAPIResource):
413
448
  cast_to=BinaryAPIResponse,
414
449
  )
415
450
 
451
+ def estimate_price(
452
+ self,
453
+ *,
454
+ training_file: str,
455
+ from_checkpoint: str | Omit = omit,
456
+ model: str | Omit = omit,
457
+ n_epochs: int | Omit = omit,
458
+ n_evals: int | Omit = omit,
459
+ training_method: fine_tuning_estimate_price_params.TrainingMethod | Omit = omit,
460
+ training_type: fine_tuning_estimate_price_params.TrainingType | Omit = omit,
461
+ validation_file: str | Omit = omit,
462
+ # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
463
+ # The extra values given here take precedence over values defined on the client or passed to this method.
464
+ extra_headers: Headers | None = None,
465
+ extra_query: Query | None = None,
466
+ extra_body: Body | None = None,
467
+ timeout: float | httpx.Timeout | None | NotGiven = not_given,
468
+ ) -> FineTuningEstimatePriceResponse:
469
+ """
470
+ Estimate the price of a fine-tuning job.
471
+
472
+ Args:
473
+ training_file: File-ID of a training file uploaded to the Together API
474
+
475
+ from_checkpoint: The checkpoint identifier to continue training from a previous fine-tuning job.
476
+ Format is `{$JOB_ID}` or `{$OUTPUT_MODEL_NAME}` or `{$JOB_ID}:{$STEP}` or
477
+ `{$OUTPUT_MODEL_NAME}:{$STEP}`. The step value is optional; without it, the
478
+ final checkpoint will be used.
479
+
480
+ model: Name of the base model to run fine-tune job on
481
+
482
+ n_epochs: Number of complete passes through the training dataset (higher values may
483
+ improve results but increase cost and risk of overfitting)
484
+
485
+ n_evals: Number of evaluations to be run on a given validation set during training
486
+
487
+ training_method: The training method to use. 'sft' for Supervised Fine-Tuning or 'dpo' for Direct
488
+ Preference Optimization.
489
+
490
+ validation_file: File-ID of a validation file uploaded to the Together API
491
+
492
+ extra_headers: Send extra headers
493
+
494
+ extra_query: Add additional query parameters to the request
495
+
496
+ extra_body: Add additional JSON properties to the request
497
+
498
+ timeout: Override the client-level default timeout for this request, in seconds
499
+ """
500
+ return self._post(
501
+ "/fine-tunes/estimate-price",
502
+ body=maybe_transform(
503
+ {
504
+ "training_file": training_file,
505
+ "from_checkpoint": from_checkpoint,
506
+ "model": model,
507
+ "n_epochs": n_epochs,
508
+ "n_evals": n_evals,
509
+ "training_method": training_method,
510
+ "training_type": training_type,
511
+ "validation_file": validation_file,
512
+ },
513
+ fine_tuning_estimate_price_params.FineTuningEstimatePriceParams,
514
+ ),
515
+ options=make_request_options(
516
+ extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
517
+ ),
518
+ cast_to=FineTuningEstimatePriceResponse,
519
+ )
520
+
416
521
  def list_checkpoints(
417
522
  self,
418
523
  id: str,
@@ -620,7 +725,7 @@ class AsyncFineTuningResource(AsyncAPIResource):
620
725
  pass
621
726
  model_limits = await async_get_model_limits(self._client, str(model_name))
622
727
 
623
- finetune_request = create_finetune_request(
728
+ finetune_request, training_type_cls, training_method_cls = create_finetune_request(
624
729
  model_limits=model_limits,
625
730
  training_file=training_file,
626
731
  model=model,
@@ -659,11 +764,32 @@ class AsyncFineTuningResource(AsyncAPIResource):
659
764
  hf_output_repo_name=hf_output_repo_name,
660
765
  )
661
766
 
767
+
768
+ price_estimation_result = await self.estimate_price(
769
+ training_file=training_file,
770
+ from_checkpoint=from_checkpoint or Omit(),
771
+ validation_file=validation_file or Omit(),
772
+ model=model or "",
773
+ n_epochs=finetune_request.n_epochs,
774
+ n_evals=finetune_request.n_evals or 0,
775
+ training_type=training_type_cls,
776
+ training_method=training_method_cls,
777
+ )
778
+
779
+
662
780
  if verbose:
663
781
  rprint(
664
782
  "Submitting a fine-tuning job with the following parameters:",
665
783
  finetune_request,
666
784
  )
785
+ if not price_estimation_result.allowed_to_proceed:
786
+ rprint(
787
+ "[red]"
788
+ + _WARNING_MESSAGE_INSUFFICIENT_FUNDS.format(
789
+ price_estimation_result.estimated_total_price # pyright: ignore[reportPossiblyUnboundVariable]
790
+ )
791
+ + "[/red]",
792
+ )
667
793
  parameter_payload = finetune_request.model_dump(exclude_none=True)
668
794
 
669
795
  return await self._client.post(
@@ -854,6 +980,76 @@ class AsyncFineTuningResource(AsyncAPIResource):
854
980
  cast_to=AsyncBinaryAPIResponse,
855
981
  )
856
982
 
983
+ async def estimate_price(
984
+ self,
985
+ *,
986
+ training_file: str,
987
+ from_checkpoint: str | Omit = omit,
988
+ model: str | Omit = omit,
989
+ n_epochs: int | Omit = omit,
990
+ n_evals: int | Omit = omit,
991
+ training_method: fine_tuning_estimate_price_params.TrainingMethod | Omit = omit,
992
+ training_type: fine_tuning_estimate_price_params.TrainingType | Omit = omit,
993
+ validation_file: str | Omit = omit,
994
+ # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
995
+ # The extra values given here take precedence over values defined on the client or passed to this method.
996
+ extra_headers: Headers | None = None,
997
+ extra_query: Query | None = None,
998
+ extra_body: Body | None = None,
999
+ timeout: float | httpx.Timeout | None | NotGiven = not_given,
1000
+ ) -> FineTuningEstimatePriceResponse:
1001
+ """
1002
+ Estimate the price of a fine-tuning job.
1003
+
1004
+ Args:
1005
+ training_file: File-ID of a training file uploaded to the Together API
1006
+
1007
+ from_checkpoint: The checkpoint identifier to continue training from a previous fine-tuning job.
1008
+ Format is `{$JOB_ID}` or `{$OUTPUT_MODEL_NAME}` or `{$JOB_ID}:{$STEP}` or
1009
+ `{$OUTPUT_MODEL_NAME}:{$STEP}`. The step value is optional; without it, the
1010
+ final checkpoint will be used.
1011
+
1012
+ model: Name of the base model to run fine-tune job on
1013
+
1014
+ n_epochs: Number of complete passes through the training dataset (higher values may
1015
+ improve results but increase cost and risk of overfitting)
1016
+
1017
+ n_evals: Number of evaluations to be run on a given validation set during training
1018
+
1019
+ training_method: The training method to use. 'sft' for Supervised Fine-Tuning or 'dpo' for Direct
1020
+ Preference Optimization.
1021
+
1022
+ validation_file: File-ID of a validation file uploaded to the Together API
1023
+
1024
+ extra_headers: Send extra headers
1025
+
1026
+ extra_query: Add additional query parameters to the request
1027
+
1028
+ extra_body: Add additional JSON properties to the request
1029
+
1030
+ timeout: Override the client-level default timeout for this request, in seconds
1031
+ """
1032
+ return await self._post(
1033
+ "/fine-tunes/estimate-price",
1034
+ body=await async_maybe_transform(
1035
+ {
1036
+ "training_file": training_file,
1037
+ "from_checkpoint": from_checkpoint,
1038
+ "model": model,
1039
+ "n_epochs": n_epochs,
1040
+ "n_evals": n_evals,
1041
+ "training_method": training_method,
1042
+ "training_type": training_type,
1043
+ "validation_file": validation_file,
1044
+ },
1045
+ fine_tuning_estimate_price_params.FineTuningEstimatePriceParams,
1046
+ ),
1047
+ options=make_request_options(
1048
+ extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
1049
+ ),
1050
+ cast_to=FineTuningEstimatePriceResponse,
1051
+ )
1052
+
857
1053
  async def list_checkpoints(
858
1054
  self,
859
1055
  id: str,
@@ -941,6 +1137,9 @@ class FineTuningResourceWithRawResponse:
941
1137
  fine_tuning.content,
942
1138
  BinaryAPIResponse,
943
1139
  )
1140
+ self.estimate_price = to_raw_response_wrapper(
1141
+ fine_tuning.estimate_price,
1142
+ )
944
1143
  self.list_checkpoints = to_raw_response_wrapper(
945
1144
  fine_tuning.list_checkpoints,
946
1145
  )
@@ -969,6 +1168,9 @@ class AsyncFineTuningResourceWithRawResponse:
969
1168
  fine_tuning.content,
970
1169
  AsyncBinaryAPIResponse,
971
1170
  )
1171
+ self.estimate_price = async_to_raw_response_wrapper(
1172
+ fine_tuning.estimate_price,
1173
+ )
972
1174
  self.list_checkpoints = async_to_raw_response_wrapper(
973
1175
  fine_tuning.list_checkpoints,
974
1176
  )
@@ -997,6 +1199,9 @@ class FineTuningResourceWithStreamingResponse:
997
1199
  fine_tuning.content,
998
1200
  StreamedBinaryAPIResponse,
999
1201
  )
1202
+ self.estimate_price = to_streamed_response_wrapper(
1203
+ fine_tuning.estimate_price,
1204
+ )
1000
1205
  self.list_checkpoints = to_streamed_response_wrapper(
1001
1206
  fine_tuning.list_checkpoints,
1002
1207
  )
@@ -1025,6 +1230,9 @@ class AsyncFineTuningResourceWithStreamingResponse:
1025
1230
  fine_tuning.content,
1026
1231
  AsyncStreamedBinaryAPIResponse,
1027
1232
  )
1233
+ self.estimate_price = async_to_streamed_response_wrapper(
1234
+ fine_tuning.estimate_price,
1235
+ )
1028
1236
  self.list_checkpoints = async_to_streamed_response_wrapper(
1029
1237
  fine_tuning.list_checkpoints,
1030
1238
  )
@@ -8,7 +8,7 @@ from typing_extensions import Literal
8
8
  import httpx
9
9
 
10
10
  from ..types import image_generate_params
11
- from .._types import Body, Omit, Query, Headers, NotGiven, omit, not_given
11
+ from .._types import Body, Omit, Query, Headers, NotGiven, SequenceNotStr, omit, not_given
12
12
  from .._utils import maybe_transform, async_maybe_transform
13
13
  from .._compat import cached_property
14
14
  from .._resource import SyncAPIResource, AsyncAPIResource
@@ -64,6 +64,7 @@ class ImagesResource(SyncAPIResource):
64
64
  n: int | Omit = omit,
65
65
  negative_prompt: str | Omit = omit,
66
66
  output_format: Literal["jpeg", "png"] | Omit = omit,
67
+ reference_images: SequenceNotStr[str] | Omit = omit,
67
68
  response_format: Literal["base64", "url"] | Omit = omit,
68
69
  seed: int | Omit = omit,
69
70
  steps: int | Omit = omit,
@@ -105,6 +106,10 @@ class ImagesResource(SyncAPIResource):
105
106
  output_format: The format of the image response. Can be either be `jpeg` or `png`. Defaults to
106
107
  `jpeg`.
107
108
 
109
+ reference_images: An array of image URLs that guide the overall appearance and style of the
110
+ generated image. These reference images influence the visual characteristics
111
+ consistently across the generation.
112
+
108
113
  response_format: Format of the image response. Can be either a base64 string or a URL.
109
114
 
110
115
  seed: Seed used for generation. Can be used to reproduce image generations.
@@ -135,6 +140,7 @@ class ImagesResource(SyncAPIResource):
135
140
  "n": n,
136
141
  "negative_prompt": negative_prompt,
137
142
  "output_format": output_format,
143
+ "reference_images": reference_images,
138
144
  "response_format": response_format,
139
145
  "seed": seed,
140
146
  "steps": steps,
@@ -189,6 +195,7 @@ class AsyncImagesResource(AsyncAPIResource):
189
195
  n: int | Omit = omit,
190
196
  negative_prompt: str | Omit = omit,
191
197
  output_format: Literal["jpeg", "png"] | Omit = omit,
198
+ reference_images: SequenceNotStr[str] | Omit = omit,
192
199
  response_format: Literal["base64", "url"] | Omit = omit,
193
200
  seed: int | Omit = omit,
194
201
  steps: int | Omit = omit,
@@ -230,6 +237,10 @@ class AsyncImagesResource(AsyncAPIResource):
230
237
  output_format: The format of the image response. Can be either be `jpeg` or `png`. Defaults to
231
238
  `jpeg`.
232
239
 
240
+ reference_images: An array of image URLs that guide the overall appearance and style of the
241
+ generated image. These reference images influence the visual characteristics
242
+ consistently across the generation.
243
+
233
244
  response_format: Format of the image response. Can be either a base64 string or a URL.
234
245
 
235
246
  seed: Seed used for generation. Can be used to reproduce image generations.
@@ -260,6 +271,7 @@ class AsyncImagesResource(AsyncAPIResource):
260
271
  "n": n,
261
272
  "negative_prompt": negative_prompt,
262
273
  "output_format": output_format,
274
+ "reference_images": reference_images,
263
275
  "response_format": response_format,
264
276
  "seed": seed,
265
277
  "steps": steps,
@@ -6,7 +6,7 @@ from typing_extensions import Literal
6
6
 
7
7
  import httpx
8
8
 
9
- from ..types import model_upload_params
9
+ from ..types import model_list_params, model_upload_params
10
10
  from .._types import Body, Omit, Query, Headers, NotGiven, omit, not_given
11
11
  from .._utils import maybe_transform, async_maybe_transform
12
12
  from .._compat import cached_property
@@ -47,6 +47,7 @@ class ModelsResource(SyncAPIResource):
47
47
  def list(
48
48
  self,
49
49
  *,
50
+ dedicated: bool | Omit = omit,
50
51
  # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
51
52
  # The extra values given here take precedence over values defined on the client or passed to this method.
52
53
  extra_headers: Headers | None = None,
@@ -54,11 +55,28 @@ class ModelsResource(SyncAPIResource):
54
55
  extra_body: Body | None = None,
55
56
  timeout: float | httpx.Timeout | None | NotGiven = not_given,
56
57
  ) -> ModelListResponse:
57
- """Lists all of Together's open-source models"""
58
+ """
59
+ Lists all of Together's open-source models
60
+
61
+ Args:
62
+ dedicated: Filter models to only return dedicated models
63
+
64
+ extra_headers: Send extra headers
65
+
66
+ extra_query: Add additional query parameters to the request
67
+
68
+ extra_body: Add additional JSON properties to the request
69
+
70
+ timeout: Override the client-level default timeout for this request, in seconds
71
+ """
58
72
  return self._get(
59
73
  "/models",
60
74
  options=make_request_options(
61
- extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
75
+ extra_headers=extra_headers,
76
+ extra_query=extra_query,
77
+ extra_body=extra_body,
78
+ timeout=timeout,
79
+ query=maybe_transform({"dedicated": dedicated}, model_list_params.ModelListParams),
62
80
  ),
63
81
  cast_to=ModelListResponse,
64
82
  )
@@ -152,6 +170,7 @@ class AsyncModelsResource(AsyncAPIResource):
152
170
  async def list(
153
171
  self,
154
172
  *,
173
+ dedicated: bool | Omit = omit,
155
174
  # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
156
175
  # The extra values given here take precedence over values defined on the client or passed to this method.
157
176
  extra_headers: Headers | None = None,
@@ -159,11 +178,28 @@ class AsyncModelsResource(AsyncAPIResource):
159
178
  extra_body: Body | None = None,
160
179
  timeout: float | httpx.Timeout | None | NotGiven = not_given,
161
180
  ) -> ModelListResponse:
162
- """Lists all of Together's open-source models"""
181
+ """
182
+ Lists all of Together's open-source models
183
+
184
+ Args:
185
+ dedicated: Filter models to only return dedicated models
186
+
187
+ extra_headers: Send extra headers
188
+
189
+ extra_query: Add additional query parameters to the request
190
+
191
+ extra_body: Add additional JSON properties to the request
192
+
193
+ timeout: Override the client-level default timeout for this request, in seconds
194
+ """
163
195
  return await self._get(
164
196
  "/models",
165
197
  options=make_request_options(
166
- extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
198
+ extra_headers=extra_headers,
199
+ extra_query=extra_query,
200
+ extra_body=extra_body,
201
+ timeout=timeout,
202
+ query=await async_maybe_transform({"dedicated": dedicated}, model_list_params.ModelListParams),
167
203
  ),
168
204
  cast_to=ModelListResponse,
169
205
  )
@@ -26,6 +26,7 @@ from .execute_response import ExecuteResponse as ExecuteResponse
26
26
  from .autoscaling_param import AutoscalingParam as AutoscalingParam
27
27
  from .finetune_response import FinetuneResponse as FinetuneResponse
28
28
  from .job_list_response import JobListResponse as JobListResponse
29
+ from .model_list_params import ModelListParams as ModelListParams
29
30
  from .tool_choice_param import ToolChoiceParam as ToolChoiceParam
30
31
  from .dedicated_endpoint import DedicatedEndpoint as DedicatedEndpoint
31
32
  from .eval_create_params import EvalCreateParams as EvalCreateParams
@@ -62,6 +63,8 @@ from .fine_tuning_delete_response import FineTuningDeleteResponse as FineTuningD
62
63
  from .endpoint_list_avzones_response import EndpointListAvzonesResponse as EndpointListAvzonesResponse
63
64
  from .code_interpreter_execute_params import CodeInterpreterExecuteParams as CodeInterpreterExecuteParams
64
65
  from .fine_tuning_list_events_response import FineTuningListEventsResponse as FineTuningListEventsResponse
66
+ from .fine_tuning_estimate_price_params import FineTuningEstimatePriceParams as FineTuningEstimatePriceParams
67
+ from .fine_tuning_estimate_price_response import FineTuningEstimatePriceResponse as FineTuningEstimatePriceResponse
65
68
  from .fine_tuning_list_checkpoints_response import (
66
69
  FineTuningListCheckpointsResponse as FineTuningListCheckpointsResponse,
67
70
  )
@@ -34,6 +34,20 @@ class TranscriptionCreateParams(TypedDict, total=False):
34
34
  If `auto` is provided, language is auto-detected.
35
35
  """
36
36
 
37
+ max_speakers: int
38
+ """Maximum number of speakers expected in the audio.
39
+
40
+ Used to improve diarization accuracy when the approximate number of speakers is
41
+ known.
42
+ """
43
+
44
+ min_speakers: int
45
+ """Minimum number of speakers expected in the audio.
46
+
47
+ Used to improve diarization accuracy when the approximate number of speakers is
48
+ known.
49
+ """
50
+
37
51
  model: Literal["openai/whisper-large-v3"]
38
52
  """Model to use for transcription"""
39
53
 
@@ -14,10 +14,14 @@ class DataVoice(BaseModel):
14
14
 
15
15
 
16
16
  class Data(BaseModel):
17
+ """Represents a model with its available voices."""
18
+
17
19
  model: str
18
20
 
19
21
  voices: List[DataVoice]
20
22
 
21
23
 
22
24
  class VoiceListResponse(BaseModel):
25
+ """Response containing a list of models and their available voices."""
26
+
23
27
  data: List[Data]
@@ -6,6 +6,8 @@ __all__ = ["Autoscaling"]
6
6
 
7
7
 
8
8
  class Autoscaling(BaseModel):
9
+ """Configuration for automatic scaling of replicas based on demand."""
10
+
9
11
  max_replicas: int
10
12
  """The maximum number of replicas to scale up to under load"""
11
13
 
@@ -8,6 +8,8 @@ __all__ = ["AutoscalingParam"]
8
8
 
9
9
 
10
10
  class AutoscalingParam(TypedDict, total=False):
11
+ """Configuration for automatic scaling of replicas based on demand."""
12
+
11
13
  max_replicas: Required[int]
12
14
  """The maximum number of replicas to scale up to under load"""
13
15
 
@@ -29,6 +29,10 @@ __all__ = [
29
29
  "FunctionCall",
30
30
  "FunctionCallName",
31
31
  "ResponseFormat",
32
+ "ResponseFormatText",
33
+ "ResponseFormatJsonSchema",
34
+ "ResponseFormatJsonSchemaJsonSchema",
35
+ "ResponseFormatJsonObject",
32
36
  "ToolChoice",
33
37
  "CompletionCreateParamsNonStreaming",
34
38
  "CompletionCreateParamsStreaming",
@@ -117,7 +121,16 @@ class CompletionCreateParamsBase(TypedDict, total=False):
117
121
  """
118
122
 
119
123
  response_format: ResponseFormat
120
- """An object specifying the format that the model must output."""
124
+ """An object specifying the format that the model must output.
125
+
126
+ Setting to `{ "type": "json_schema", "json_schema": {...} }` enables Structured
127
+ Outputs which ensures the model will match your supplied JSON schema. Learn more
128
+ in the [Structured Outputs guide](https://docs.together.ai/docs/json-mode).
129
+
130
+ Setting to `{ "type": "json_object" }` enables the older JSON mode, which
131
+ ensures the message the model generates is valid JSON. Using `json_schema` is
132
+ preferred for models that support it.
133
+ """
121
134
 
122
135
  safety_model: str
123
136
  """The name of the moderation model used to validate tokens.
@@ -297,13 +310,73 @@ class FunctionCallName(TypedDict, total=False):
297
310
  FunctionCall: TypeAlias = Union[Literal["none", "auto"], FunctionCallName]
298
311
 
299
312
 
300
- class ResponseFormat(TypedDict, total=False):
313
+ class ResponseFormatText(TypedDict, total=False):
314
+ """Default response format. Used to generate text responses."""
315
+
316
+ type: Required[Literal["text"]]
317
+ """The type of response format being defined. Always `text`."""
318
+
319
+
320
+ class ResponseFormatJsonSchemaJsonSchema(TypedDict, total=False):
321
+ """Structured Outputs configuration options, including a JSON Schema."""
322
+
323
+ name: Required[str]
324
+ """The name of the response format.
325
+
326
+ Must be a-z, A-Z, 0-9, or contain underscores and dashes, with a maximum length
327
+ of 64.
328
+ """
329
+
330
+ description: str
331
+ """
332
+ A description of what the response format is for, used by the model to determine
333
+ how to respond in the format.
334
+ """
335
+
301
336
  schema: Dict[str, object]
302
- """The schema of the response format."""
337
+ """
338
+ The schema for the response format, described as a JSON Schema object. Learn how
339
+ to build JSON schemas [here](https://json-schema.org/).
340
+ """
341
+
342
+ strict: Optional[bool]
343
+ """
344
+ Whether to enable strict schema adherence when generating the output. If set to
345
+ true, the model will always follow the exact schema defined in the `schema`
346
+ field. Only a subset of JSON Schema is supported when `strict` is `true`. To
347
+ learn more, read the
348
+ [Structured Outputs guide](https://docs.together.ai/docs/json-mode).
349
+ """
350
+
351
+
352
+ class ResponseFormatJsonSchema(TypedDict, total=False):
353
+ """JSON Schema response format.
354
+
355
+ Used to generate structured JSON responses.
356
+ Learn more about [Structured Outputs](https://docs.together.ai/docs/json-mode).
357
+ """
358
+
359
+ json_schema: Required[ResponseFormatJsonSchemaJsonSchema]
360
+ """Structured Outputs configuration options, including a JSON Schema."""
361
+
362
+ type: Required[Literal["json_schema"]]
363
+ """The type of response format being defined. Always `json_schema`."""
364
+
365
+
366
+ class ResponseFormatJsonObject(TypedDict, total=False):
367
+ """JSON object response format.
368
+
369
+ An older method of generating JSON responses.
370
+ Using `json_schema` is recommended for models that support it. Note that the
371
+ model will not generate JSON without a system or user message instructing it
372
+ to do so.
373
+ """
374
+
375
+ type: Required[Literal["json_object"]]
376
+ """The type of response format being defined. Always `json_object`."""
303
377
 
304
- type: str
305
- """The type of the response format."""
306
378
 
379
+ ResponseFormat: TypeAlias = Union[ResponseFormatText, ResponseFormatJsonSchema, ResponseFormatJsonObject]
307
380
 
308
381
  ToolChoice: TypeAlias = Union[str, ToolChoiceParam]
309
382
 
@@ -10,6 +10,8 @@ __all__ = ["DedicatedEndpoint"]
10
10
 
11
11
 
12
12
  class DedicatedEndpoint(BaseModel):
13
+ """Details about a dedicated endpoint deployment"""
14
+
13
15
  id: str
14
16
  """Unique identifier for the endpoint"""
15
17
 
@@ -8,4 +8,6 @@ __all__ = ["EndpointListAvzonesResponse"]
8
8
 
9
9
 
10
10
  class EndpointListAvzonesResponse(BaseModel):
11
+ """List of unique availability zones"""
12
+
11
13
  avzones: List[str]
@@ -10,6 +10,8 @@ __all__ = ["EndpointListResponse", "Data"]
10
10
 
11
11
 
12
12
  class Data(BaseModel):
13
+ """Details about an endpoint when listed via the list endpoint"""
14
+
13
15
  id: str
14
16
  """Unique identifier for the endpoint"""
15
17