together 1.5.33.tar.gz → 1.5.35.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (76)
  1. {together-1.5.33 → together-1.5.35}/PKG-INFO +1 -1
  2. {together-1.5.33 → together-1.5.35}/pyproject.toml +1 -1
  3. {together-1.5.33 → together-1.5.35}/src/together/cli/api/endpoints.py +3 -1
  4. {together-1.5.33 → together-1.5.35}/src/together/cli/api/finetune.py +13 -9
  5. {together-1.5.33 → together-1.5.35}/src/together/cli/api/utils.py +5 -5
  6. {together-1.5.33 → together-1.5.35}/src/together/constants.py +6 -0
  7. {together-1.5.33 → together-1.5.35}/src/together/resources/endpoints.py +13 -0
  8. {together-1.5.33 → together-1.5.35}/src/together/resources/finetune.py +26 -4
  9. {together-1.5.33 → together-1.5.35}/src/together/types/__init__.py +29 -31
  10. {together-1.5.33 → together-1.5.35}/src/together/types/finetune.py +16 -4
  11. {together-1.5.33 → together-1.5.35}/src/together/utils/files.py +202 -35
  12. {together-1.5.33 → together-1.5.35}/LICENSE +0 -0
  13. {together-1.5.33 → together-1.5.35}/README.md +0 -0
  14. {together-1.5.33 → together-1.5.35}/src/together/__init__.py +0 -0
  15. {together-1.5.33 → together-1.5.35}/src/together/abstract/__init__.py +0 -0
  16. {together-1.5.33 → together-1.5.35}/src/together/abstract/api_requestor.py +0 -0
  17. {together-1.5.33 → together-1.5.35}/src/together/cli/__init__.py +0 -0
  18. {together-1.5.33 → together-1.5.35}/src/together/cli/api/__init__.py +0 -0
  19. {together-1.5.33 → together-1.5.35}/src/together/cli/api/chat.py +0 -0
  20. {together-1.5.33 → together-1.5.35}/src/together/cli/api/completions.py +0 -0
  21. {together-1.5.33 → together-1.5.35}/src/together/cli/api/evaluation.py +0 -0
  22. {together-1.5.33 → together-1.5.35}/src/together/cli/api/files.py +0 -0
  23. {together-1.5.33 → together-1.5.35}/src/together/cli/api/images.py +0 -0
  24. {together-1.5.33 → together-1.5.35}/src/together/cli/api/models.py +0 -0
  25. {together-1.5.33 → together-1.5.35}/src/together/cli/cli.py +0 -0
  26. {together-1.5.33 → together-1.5.35}/src/together/client.py +0 -0
  27. {together-1.5.33 → together-1.5.35}/src/together/error.py +0 -0
  28. {together-1.5.33 → together-1.5.35}/src/together/filemanager.py +0 -0
  29. {together-1.5.33 → together-1.5.35}/src/together/legacy/__init__.py +0 -0
  30. {together-1.5.33 → together-1.5.35}/src/together/legacy/base.py +0 -0
  31. {together-1.5.33 → together-1.5.35}/src/together/legacy/complete.py +0 -0
  32. {together-1.5.33 → together-1.5.35}/src/together/legacy/embeddings.py +0 -0
  33. {together-1.5.33 → together-1.5.35}/src/together/legacy/files.py +0 -0
  34. {together-1.5.33 → together-1.5.35}/src/together/legacy/finetune.py +0 -0
  35. {together-1.5.33 → together-1.5.35}/src/together/legacy/images.py +0 -0
  36. {together-1.5.33 → together-1.5.35}/src/together/legacy/models.py +0 -0
  37. {together-1.5.33 → together-1.5.35}/src/together/resources/__init__.py +0 -0
  38. {together-1.5.33 → together-1.5.35}/src/together/resources/audio/__init__.py +0 -0
  39. {together-1.5.33 → together-1.5.35}/src/together/resources/audio/speech.py +0 -0
  40. {together-1.5.33 → together-1.5.35}/src/together/resources/audio/transcriptions.py +0 -0
  41. {together-1.5.33 → together-1.5.35}/src/together/resources/audio/translations.py +0 -0
  42. {together-1.5.33 → together-1.5.35}/src/together/resources/audio/voices.py +0 -0
  43. {together-1.5.33 → together-1.5.35}/src/together/resources/batch.py +0 -0
  44. {together-1.5.33 → together-1.5.35}/src/together/resources/chat/__init__.py +0 -0
  45. {together-1.5.33 → together-1.5.35}/src/together/resources/chat/completions.py +0 -0
  46. {together-1.5.33 → together-1.5.35}/src/together/resources/code_interpreter.py +0 -0
  47. {together-1.5.33 → together-1.5.35}/src/together/resources/completions.py +0 -0
  48. {together-1.5.33 → together-1.5.35}/src/together/resources/embeddings.py +0 -0
  49. {together-1.5.33 → together-1.5.35}/src/together/resources/evaluation.py +0 -0
  50. {together-1.5.33 → together-1.5.35}/src/together/resources/files.py +0 -0
  51. {together-1.5.33 → together-1.5.35}/src/together/resources/images.py +0 -0
  52. {together-1.5.33 → together-1.5.35}/src/together/resources/models.py +0 -0
  53. {together-1.5.33 → together-1.5.35}/src/together/resources/rerank.py +0 -0
  54. {together-1.5.33 → together-1.5.35}/src/together/resources/videos.py +0 -0
  55. {together-1.5.33 → together-1.5.35}/src/together/together_response.py +0 -0
  56. {together-1.5.33 → together-1.5.35}/src/together/types/abstract.py +0 -0
  57. {together-1.5.33 → together-1.5.35}/src/together/types/audio_speech.py +0 -0
  58. {together-1.5.33 → together-1.5.35}/src/together/types/batch.py +0 -0
  59. {together-1.5.33 → together-1.5.35}/src/together/types/chat_completions.py +0 -0
  60. {together-1.5.33 → together-1.5.35}/src/together/types/code_interpreter.py +0 -0
  61. {together-1.5.33 → together-1.5.35}/src/together/types/common.py +0 -0
  62. {together-1.5.33 → together-1.5.35}/src/together/types/completions.py +0 -0
  63. {together-1.5.33 → together-1.5.35}/src/together/types/embeddings.py +0 -0
  64. {together-1.5.33 → together-1.5.35}/src/together/types/endpoints.py +0 -0
  65. {together-1.5.33 → together-1.5.35}/src/together/types/error.py +0 -0
  66. {together-1.5.33 → together-1.5.35}/src/together/types/evaluation.py +0 -0
  67. {together-1.5.33 → together-1.5.35}/src/together/types/files.py +0 -0
  68. {together-1.5.33 → together-1.5.35}/src/together/types/images.py +0 -0
  69. {together-1.5.33 → together-1.5.35}/src/together/types/models.py +0 -0
  70. {together-1.5.33 → together-1.5.35}/src/together/types/rerank.py +0 -0
  71. {together-1.5.33 → together-1.5.35}/src/together/types/videos.py +0 -0
  72. {together-1.5.33 → together-1.5.35}/src/together/utils/__init__.py +0 -0
  73. {together-1.5.33 → together-1.5.35}/src/together/utils/_log.py +0 -0
  74. {together-1.5.33 → together-1.5.35}/src/together/utils/api_helpers.py +0 -0
  75. {together-1.5.33 → together-1.5.35}/src/together/utils/tools.py +0 -0
  76. {together-1.5.33 → together-1.5.35}/src/together/version.py +0 -0
{together-1.5.33 → together-1.5.35}/PKG-INFO
@@ -1,6 +1,6 @@
  Metadata-Version: 2.4
  Name: together
- Version: 1.5.33
+ Version: 1.5.35
  Summary: Python client for Together's Cloud Platform! Note: SDK 2.0 is now available at https://github.com/togethercomputer/together-py
  License: Apache-2.0
  License-File: LICENSE
{together-1.5.33 → together-1.5.35}/pyproject.toml
@@ -12,7 +12,7 @@ build-backend = "poetry.masonry.api"

  [tool.poetry]
  name = "together"
- version = "1.5.33"
+ version = "1.5.35"
  authors = ["Together AI <support@together.ai>"]
  description = "Python client for Together's Cloud Platform! Note: SDK 2.0 is now available at https://github.com/togethercomputer/together-py"
  readme = "README.md"
{together-1.5.33 → together-1.5.35}/src/together/cli/api/endpoints.py
@@ -98,7 +98,7 @@ def endpoints(ctx: click.Context) -> None:
  )
  @click.option(
      "--gpu",
-     type=click.Choice(["h100", "a100", "l40", "l40s", "rtx-6000"]),
+     type=click.Choice(["b200", "h200", "h100", "a100", "l40", "l40s", "rtx-6000"]),
      required=True,
      help="GPU type to use for inference",
  )
@@ -161,6 +161,8 @@ def create(
      """Create a new dedicated inference endpoint."""
      # Map GPU types to their full hardware ID names
      gpu_map = {
+         "b200": "nvidia_b200_180gb_sxm",
+         "h200": "nvidia_h200_140gb_sxm",
          "h100": "nvidia_h100_80gb_sxm",
          "a100": "nvidia_a100_80gb_pcie" if gpu_count == 1 else "nvidia_a100_80gb_sxm",
          "l40": "nvidia_l40",
{together-1.5.33 → together-1.5.35}/src/together/cli/api/finetune.py
@@ -1,7 +1,6 @@
  from __future__ import annotations

  import json
- import re
  from datetime import datetime, timezone
  from textwrap import wrap
  from typing import Any, Literal
@@ -14,18 +13,11 @@ from tabulate import tabulate

  from together import Together
  from together.cli.api.utils import BOOL_WITH_AUTO, INT_WITH_MAX, generate_progress_bar
- from together.types.finetune import (
-     DownloadCheckpointType,
-     FinetuneEventType,
-     FinetuneTrainingLimits,
-     FullTrainingType,
-     LoRATrainingType,
- )
+ from together.types.finetune import DownloadCheckpointType, FinetuneTrainingLimits
  from together.utils import (
      finetune_price_to_dollars,
      format_timestamp,
      log_warn,
-     log_warn_once,
      parse_timestamp,
  )

@@ -203,6 +195,12 @@ def fine_tuning(ctx: click.Context) -> None:
      help="Whether to mask the user messages in conversational data or prompts in instruction data. "
      "`auto` will automatically determine whether to mask the inputs based on the data format.",
  )
+ @click.option(
+     "--train-vision",
+     type=bool,
+     default=False,
+     help="Whether to train the vision encoder. Only supported for multimodal models.",
+ )
  @click.option(
      "--from-checkpoint",
      type=str,
@@ -258,6 +256,7 @@ def create(
      lora_dropout: float,
      lora_alpha: float,
      lora_trainable_modules: str,
+     train_vision: bool,
      suffix: str,
      wandb_api_key: str,
      wandb_base_url: str,
@@ -299,6 +298,7 @@ def create(
          lora_dropout=lora_dropout,
          lora_alpha=lora_alpha,
          lora_trainable_modules=lora_trainable_modules,
+         train_vision=train_vision,
          suffix=suffix,
          wandb_api_key=wandb_api_key,
          wandb_base_url=wandb_base_url,
@@ -368,6 +368,10 @@ def create(
              "You have specified a number of evaluation loops but no validation file."
          )

+     if model_limits.supports_vision:
+         # Don't show price estimation for multimodal models yet
+         confirm = True
+
      finetune_price_estimation_result = client.fine_tuning.estimate_price(
          training_file=training_file,
          validation_file=validation_file,
{together-1.5.33 → together-1.5.35}/src/together/cli/api/utils.py
@@ -103,13 +103,13 @@ def generate_progress_bar(
      progress = "Progress: [bold red]unavailable[/bold red]"
      if finetune_job.status in COMPLETED_STATUSES:
          progress = "Progress: [bold green]completed[/bold green]"
-     elif finetune_job.updated_at is not None:
+     elif finetune_job.started_at is not None:
          # Replace 'Z' with '+00:00' for Python 3.10 compatibility
-         updated_at_str = finetune_job.updated_at.replace("Z", "+00:00")
-         update_at = datetime.fromisoformat(updated_at_str).astimezone()
+         started_at_str = finetune_job.started_at.replace("Z", "+00:00")
+         started_at = datetime.fromisoformat(started_at_str).astimezone()

          if finetune_job.progress is not None:
-             if current_time < update_at:
+             if current_time < started_at:
                  return progress

              if not finetune_job.progress.estimate_available:
@@ -118,7 +118,7 @@ def generate_progress_bar(
              if finetune_job.progress.seconds_remaining <= 0:
                  return progress

-             elapsed_time = (current_time - update_at).total_seconds()
+             elapsed_time = (current_time - started_at).total_seconds()
              ratio_filled = min(
                  elapsed_time / finetune_job.progress.seconds_remaining, 1.0
              )
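Note: the progress bar now anchors its estimate to the job's `started_at` timestamp instead of `updated_at`, filling in proportion to elapsed time over the estimated seconds remaining, capped at 1.0. A small standalone sketch with hypothetical values:

    from datetime import datetime, timedelta, timezone

    # Hypothetical job: started 30 minutes ago, estimator reports 3600s remaining
    started_at = datetime.now(timezone.utc) - timedelta(minutes=30)
    seconds_remaining = 3600

    elapsed_time = (datetime.now(timezone.utc) - started_at).total_seconds()
    ratio_filled = min(elapsed_time / seconds_remaining, 1.0)
    print(f"fill: {ratio_filled:.0%}")  # fill: 50%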
{together-1.5.33 → together-1.5.35}/src/together/constants.py
@@ -1,5 +1,6 @@
  import enum

+
  # Session constants
  TIMEOUT_SECS = 600
  MAX_SESSION_LIFETIME_SECS = 180
@@ -40,6 +41,11 @@ MIN_SAMPLES = 1
  # the number of bytes in a gigabyte, used to convert bytes to GB for readable comparison
  NUM_BYTES_IN_GB = 2**30

+ # Multimodal limits
+ MAX_IMAGES_PER_EXAMPLE = 10
+ MAX_IMAGE_BYTES = 10 * 1024 * 1024  # 10MB
+ # Max length = Header length + base64 factor (4/3) * image bytes
+ MAX_BASE64_IMAGE_LENGTH = len("data:image/jpeg;base64,") + 4 * MAX_IMAGE_BYTES // 3

  # expected columns for Parquet files
  PARQUET_EXPECTED_COLUMNS = ["input_ids", "attention_mask", "labels"]
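Note: base64 encodes every 3 bytes as 4 characters, so the data-URL length cap is the 23-character "data:image/jpeg;base64," header plus 4/3 of the 10 MiB byte limit. A quick check of the arithmetic:

    MAX_IMAGE_BYTES = 10 * 1024 * 1024                  # 10,485,760 bytes
    header_length = len("data:image/jpeg;base64,")      # 23 characters
    print(header_length + 4 * MAX_IMAGE_BYTES // 3)     # 13,981,036 characters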
{together-1.5.33 → together-1.5.35}/src/together/resources/endpoints.py
@@ -1,5 +1,6 @@
  from __future__ import annotations

+ import warnings
  from typing import Dict, List, Literal, Optional, Union

  from together.abstract import api_requestor
@@ -96,6 +97,12 @@ class Endpoints:
          Returns:
              DedicatedEndpoint: Object containing endpoint information
          """
+         if disable_prompt_cache:
+             warnings.warn(
+                 "The 'disable_prompt_cache' parameter (CLI flag: '--no-prompt-cache') is deprecated and will be removed in a future version.",
+                 stacklevel=2,
+             )
+
          requestor = api_requestor.APIRequestor(
              client=self._client,
          )
@@ -389,6 +396,12 @@ class AsyncEndpoints:
          Returns:
              DedicatedEndpoint: Object containing endpoint information
          """
+         if disable_prompt_cache:
+             warnings.warn(
+                 "The 'disable_prompt_cache' parameter (CLI flag: '--no-prompt-cache') is deprecated and will be removed in a future version.",
+                 stacklevel=2,
+             )
+
          requestor = api_requestor.APIRequestor(
              client=self._client,
          )
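Note: both the sync and async create() methods now warn whenever disable_prompt_cache is passed. A hedged sketch of how a caller would surface the warning (the endpoint arguments below are placeholders, not the full create() signature):

    import warnings

    from together import Together

    client = Together()

    with warnings.catch_warnings(record=True) as caught:
        warnings.simplefilter("always")
        client.endpoints.create(
            model="<model-name>",             # placeholder
            hardware="nvidia_h100_80gb_sxm",  # placeholder
            disable_prompt_cache=True,        # triggers the new warning
        )
    print(caught[0].message if caught else "no warning")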
{together-1.5.33 → together-1.5.35}/src/together/resources/finetune.py
@@ -2,7 +2,7 @@ from __future__ import annotations

  import re
  from pathlib import Path
- from typing import List, Dict, Literal
+ from typing import Dict, List, Literal

  from rich import print as rprint

@@ -18,10 +18,11 @@ from together.types import (
      FinetuneList,
      FinetuneListEvents,
      FinetuneLRScheduler,
-     FinetuneRequest,
-     FinetuneResponse,
+     FinetuneMultimodalParams,
      FinetunePriceEstimationRequest,
      FinetunePriceEstimationResponse,
+     FinetuneRequest,
+     FinetuneResponse,
      FinetuneTrainingLimits,
      FullTrainingType,
      LinearLRScheduler,
@@ -73,6 +74,7 @@ def create_finetune_request(
      lora_dropout: float | None = 0,
      lora_alpha: float | None = None,
      lora_trainable_modules: str | None = "all-linear",
+     train_vision: bool = False,
      suffix: str | None = None,
      wandb_api_key: str | None = None,
      wandb_base_url: str | None = None,
@@ -252,6 +254,15 @@ def create_finetune_request(
          simpo_gamma=simpo_gamma,
      )

+     if model_limits.supports_vision:
+         multimodal_params = FinetuneMultimodalParams(train_vision=train_vision)
+     elif not model_limits.supports_vision and train_vision:
+         raise ValueError(
+             f"Vision encoder training is not supported for the non-multimodal model `{model}`"
+         )
+     else:
+         multimodal_params = None
+
      finetune_request = FinetuneRequest(
          model=model,
          training_file=training_file,
@@ -272,6 +283,7 @@
          wandb_project_name=wandb_project_name,
          wandb_name=wandb_name,
          training_method=training_method_cls,
+         multimodal_params=multimodal_params,
          from_checkpoint=from_checkpoint,
          from_hf_model=from_hf_model,
          hf_model_revision=hf_model_revision,
@@ -342,6 +354,7 @@ class FineTuning:
          lora_dropout: float | None = 0,
          lora_alpha: float | None = None,
          lora_trainable_modules: str | None = "all-linear",
+         train_vision: bool = False,
          suffix: str | None = None,
          wandb_api_key: str | None = None,
          wandb_base_url: str | None = None,
@@ -387,6 +400,7 @@ class FineTuning:
              lora_dropout (float, optional): Dropout rate for LoRA adapters. Defaults to 0.
              lora_alpha (float, optional): Alpha for LoRA adapters. Defaults to 8.
              lora_trainable_modules (str, optional): Trainable modules for LoRA adapters. Defaults to "all-linear".
+             train_vision (bool, optional): Whether to train vision encoder in multimodal models. Defaults to False.
              suffix (str, optional): Up to 40 character suffix that will be added to your fine-tuned model name.
                  Defaults to None.
              wandb_api_key (str, optional): API key for Weights & Biases integration.
@@ -464,6 +478,7 @@ class FineTuning:
              lora_dropout=lora_dropout,
              lora_alpha=lora_alpha,
              lora_trainable_modules=lora_trainable_modules,
+             train_vision=train_vision,
              suffix=suffix,
              wandb_api_key=wandb_api_key,
              wandb_base_url=wandb_base_url,
@@ -906,6 +921,7 @@ class AsyncFineTuning:
          lora_dropout: float | None = 0,
          lora_alpha: float | None = None,
          lora_trainable_modules: str | None = "all-linear",
+         train_vision: bool = False,
          suffix: str | None = None,
          wandb_api_key: str | None = None,
          wandb_base_url: str | None = None,
@@ -951,6 +967,7 @@ class AsyncFineTuning:
              lora_dropout (float, optional): Dropout rate for LoRA adapters. Defaults to 0.
              lora_alpha (float, optional): Alpha for LoRA adapters. Defaults to 8.
              lora_trainable_modules (str, optional): Trainable modules for LoRA adapters. Defaults to "all-linear".
+             train_vision (bool, optional): Whether to train vision encoder in multimodal models. Defaults to False.
              suffix (str, optional): Up to 40 character suffix that will be added to your fine-tuned model name.
                  Defaults to None.
              wandb_api_key (str, optional): API key for Weights & Biases integration.
@@ -1028,6 +1045,7 @@ class AsyncFineTuning:
              lora_dropout=lora_dropout,
              lora_alpha=lora_alpha,
              lora_trainable_modules=lora_trainable_modules,
+             train_vision=train_vision,
              suffix=suffix,
              wandb_api_key=wandb_api_key,
              wandb_base_url=wandb_base_url,
@@ -1046,7 +1064,11 @@ class AsyncFineTuning:
              hf_output_repo_name=hf_output_repo_name,
          )

-         if from_checkpoint is None and from_hf_model is None:
+         if (
+             from_checkpoint is None
+             and from_hf_model is None
+             and not model_limits.supports_vision
+         ):
              price_estimation_result = await self.estimate_price(
                  training_file=training_file,
                  validation_file=validation_file,
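Note: taken together, vision-encoder training is opt-in through the new train_vision flag; non-multimodal models reject it with a ValueError, and multimodal models skip the price-estimation step. A hedged sketch of the sync call (file ID and model name are placeholders):

    from together import Together

    client = Together()

    job = client.fine_tuning.create(
        training_file="file-xxxxxxxx",    # placeholder file ID
        model="<multimodal-model-name>",  # any model whose limits report supports_vision=True
        train_vision=True,                # new in this release; defaults to False
    )
    print(job.id, job.status)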
{together-1.5.33 → together-1.5.35}/src/together/types/__init__.py
@@ -7,17 +7,18 @@ from together.types.audio_speech import (
      AudioSpeechStreamChunk,
      AudioSpeechStreamEvent,
      AudioSpeechStreamResponse,
+     AudioTimestampGranularities,
      AudioTranscriptionRequest,
-     AudioTranslationRequest,
      AudioTranscriptionResponse,
+     AudioTranscriptionResponseFormat,
      AudioTranscriptionVerboseResponse,
+     AudioTranslationRequest,
      AudioTranslationResponse,
      AudioTranslationVerboseResponse,
-     AudioTranscriptionResponseFormat,
-     AudioTimestampGranularities,
      ModelVoices,
      VoiceListResponse,
  )
+ from together.types.batch import BatchEndpoint, BatchJob, BatchJobStatus
  from together.types.chat_completions import (
      ChatCompletionChunk,
      ChatCompletionRequest,
@@ -31,6 +32,19 @@ from together.types.completions import (
  )
  from together.types.embeddings import EmbeddingRequest, EmbeddingResponse
  from together.types.endpoints import Autoscaling, DedicatedEndpoint, ListEndpoint
+ from together.types.evaluation import (
+     ClassifyParameters,
+     CompareParameters,
+     EvaluationCreateResponse,
+     EvaluationJob,
+     EvaluationRequest,
+     EvaluationStatus,
+     EvaluationStatusResponse,
+     EvaluationType,
+     JudgeModelConfig,
+     ModelRequest,
+     ScoreParameters,
+ )
  from together.types.files import (
      FileDeleteResponse,
      FileList,
@@ -41,49 +55,32 @@ from together.types.files import (
      FileType,
  )
  from together.types.finetune import (
-     TrainingMethodDPO,
-     TrainingMethodSFT,
-     FinetuneCheckpoint,
      CosineLRScheduler,
      CosineLRSchedulerArgs,
+     FinetuneCheckpoint,
+     FinetuneDeleteResponse,
      FinetuneDownloadResult,
-     LinearLRScheduler,
-     LinearLRSchedulerArgs,
-     FinetuneLRScheduler,
      FinetuneList,
      FinetuneListEvents,
-     FinetuneRequest,
-     FinetuneResponse,
+     FinetuneLRScheduler,
+     FinetuneMultimodalParams,
      FinetunePriceEstimationRequest,
      FinetunePriceEstimationResponse,
-     FinetuneDeleteResponse,
+     FinetuneRequest,
+     FinetuneResponse,
      FinetuneTrainingLimits,
      FullTrainingType,
+     LinearLRScheduler,
+     LinearLRSchedulerArgs,
      LoRATrainingType,
+     TrainingMethodDPO,
+     TrainingMethodSFT,
      TrainingType,
  )
  from together.types.images import ImageRequest, ImageResponse
  from together.types.models import ModelObject, ModelUploadRequest, ModelUploadResponse
  from together.types.rerank import RerankRequest, RerankResponse
- from together.types.batch import BatchJob, BatchJobStatus, BatchEndpoint
- from together.types.evaluation import (
-     EvaluationType,
-     EvaluationStatus,
-     JudgeModelConfig,
-     ModelRequest,
-     ClassifyParameters,
-     ScoreParameters,
-     CompareParameters,
-     EvaluationRequest,
-     EvaluationCreateResponse,
-     EvaluationJob,
-     EvaluationStatusResponse,
- )
- from together.types.videos import (
-     CreateVideoBody,
-     CreateVideoResponse,
-     VideoJob,
- )
+ from together.types.videos import CreateVideoBody, CreateVideoResponse, VideoJob


  __all__ = [
@@ -131,6 +128,7 @@ __all__ = [
      "RerankRequest",
      "RerankResponse",
      "FinetuneTrainingLimits",
+     "FinetuneMultimodalParams",
      "AudioSpeechRequest",
      "AudioResponseFormat",
      "AudioLanguage",
{together-1.5.33 → together-1.5.35}/src/together/types/finetune.py
@@ -1,14 +1,12 @@
  from __future__ import annotations

  from enum import Enum
- from typing import List, Literal, Any
+ from typing import Any, List, Literal

  from pydantic import Field, StrictBool, field_validator

  from together.types.abstract import BaseModel
- from together.types.common import (
-     ObjectType,
- )
+ from together.types.common import ObjectType


  class FinetuneJobStatus(str, Enum):
@@ -175,6 +173,14 @@ class TrainingMethodDPO(TrainingMethod):
      simpo_gamma: float | None = None


+ class FinetuneMultimodalParams(BaseModel):
+     """
+     Multimodal parameters
+     """
+
+     train_vision: bool = False
+
+
  class FinetuneProgress(BaseModel):
      """
      Fine-tune job progress
@@ -231,6 +237,8 @@ class FinetuneRequest(BaseModel):
      )
      # from step
      from_checkpoint: str | None = None
+     # multimodal parameters
+     multimodal_params: FinetuneMultimodalParams | None = None
      # hf related fields
      hf_api_token: str | None = None
      hf_output_repo_name: str | None = None
@@ -278,6 +286,7 @@ class FinetuneResponse(BaseModel):
      # created/updated datetime stamps
      created_at: str | None = None
      updated_at: str | None = None
+     started_at: str | None = None
      # job status
      status: FinetuneJobStatus | None = None
      # job id
@@ -313,6 +322,8 @@ class FinetuneResponse(BaseModel):
      training_file_size: int | None = Field(None, alias="TrainingFileSize")
      train_on_inputs: StrictBool | Literal["auto"] | None = "auto"
      from_checkpoint: str | None = None
+     # multimodal parameters
+     multimodal_params: FinetuneMultimodalParams | None = None

      progress: FinetuneProgress | None = None

@@ -409,6 +420,7 @@ class FinetuneTrainingLimits(BaseModel):
      min_learning_rate: float
      full_training: FinetuneFullTrainingLimits | None = None
      lora_training: FinetuneLoraTrainingLimits | None = None
+     supports_vision: bool = False


  class LinearLRSchedulerArgs(BaseModel):
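Note: FinetuneMultimodalParams is also re-exported from together.types (see the __all__ addition above), so the new request/response field can be constructed directly. A minimal sketch:

    from together.types import FinetuneMultimodalParams

    params = FinetuneMultimodalParams(train_vision=True)
    print(params.train_vision)  # True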
{together-1.5.33 → together-1.5.35}/src/together/utils/files.py
@@ -1,8 +1,8 @@
  from __future__ import annotations

+ import csv
  import json
  import os
- import csv
  from pathlib import Path
  from traceback import format_exc
  from typing import Any, Dict, List
@@ -10,18 +10,30 @@ from typing import Any, Dict, List
  from tqdm import tqdm

  from together.constants import (
+     JSONL_REQUIRED_COLUMNS_MAP,
+     MAX_BASE64_IMAGE_LENGTH,
      MAX_FILE_SIZE_GB,
+     MAX_IMAGES_PER_EXAMPLE,
      MIN_SAMPLES,
      NUM_BYTES_IN_GB,
      PARQUET_EXPECTED_COLUMNS,
-     JSONL_REQUIRED_COLUMNS_MAP,
-     REQUIRED_COLUMNS_MESSAGE,
      POSSIBLE_ROLES_CONVERSATION,
+     REQUIRED_COLUMNS_MESSAGE,
      DatasetFormat,
  )
  from together.types import FilePurpose


+ # MessageContent is a string or a list of dicts with 'type': 'text' or 'image_url', and 'text' or 'image_url.url'
+ # Example: "Hello" or [
+ #     {"type": "text", "text": "Hello"},
+ #     {"type": "image_url", "image_url": {
+ #         "url": "data:image/jpeg;base64,..."
+ #     }}
+ # ]
+ MessageContent = str | list[dict[str, Any]]
+
+
  class InvalidFileFormatError(ValueError):
      """Exception raised for invalid file formats during file checks."""

@@ -70,7 +82,7 @@ def check_file(

      if file_size > MAX_FILE_SIZE_GB * NUM_BYTES_IN_GB:
          report_dict["message"] = (
-             f"Maximum supported file size is {MAX_FILE_SIZE_GB} GB. Found file with size of {round(file_size / NUM_BYTES_IN_GB ,3)} GB."
+             f"Maximum supported file size is {MAX_FILE_SIZE_GB} GB. Found file with size of {round(file_size / NUM_BYTES_IN_GB, 3)} GB."
          )
          report_dict["is_check_passed"] = False
      elif file_size == 0:
@@ -103,7 +115,9 @@ def check_file(
      return report_dict


- def _check_conversation_type(messages: List[Dict[str, str | bool]], idx: int) -> None:
+ def _check_conversation_type(
+     messages: List[Dict[str, str | int | MessageContent]], idx: int
+ ) -> None:
      """Check that the conversation has correct type.

      Args:
@@ -145,12 +159,6 @@ def _check_conversation_type(
                      line_number=idx + 1,
                      error_source="key_value",
                  )
-             if not isinstance(message[column], str):
-                 raise InvalidFileFormatError(
-                     message=f"Column `{column}` is not a string on line {idx + 1}. Found {type(message[column])}",
-                     line_number=idx + 1,
-                     error_source="text_field",
-                 )


  def _check_conversation_roles(
@@ -175,7 +183,9 @@ def _check_conversation_roles(
      )


- def _check_message_weight(message: Dict[str, str | bool], idx: int) -> None:
+ def _check_message_weight(
+     message: Dict[str, str | int | MessageContent], idx: int
+ ) -> int | None:
      """Check that the message has a weight with the correct type and value.

      Args:
@@ -199,11 +209,14 @@ def _check_message_weight(
                  line_number=idx + 1,
                  error_source="key_value",
              )
+         return weight
+
+     return None


  def _check_message_role(
-     message: Dict[str, str | bool], previous_role: str | None, idx: int
- ) -> str | bool:
+     message: Dict[str, str | int | MessageContent], previous_role: str | None, idx: int
+ ) -> str:
      """Check that the message has correct roles.

      Args:
@@ -217,6 +230,14 @@ def _check_message_role(
      Raises:
          InvalidFileFormatError: If the message role is invalid.
      """
+     if not isinstance(message["role"], str):
+         raise InvalidFileFormatError(
+             message=f"Invalid role `{message['role']}` in conversation on line {idx + 1}. "
+             f"Role must be a string. Found {type(message['role'])}",
+             line_number=idx + 1,
+             error_source="key_value",
+         )
+
      if message["role"] not in POSSIBLE_ROLES_CONVERSATION:
          raise InvalidFileFormatError(
              message=f"Invalid role `{message['role']}` in conversation on line {idx + 1}. "
@@ -234,8 +255,134 @@ def _check_message_role(
      return message["role"]


+ def _check_message_content(
+     message_content: str | int | MessageContent, role: str, idx: int
+ ) -> tuple[bool, int]:
+     """Check that the message content has the correct type.
+     Message content can be either a) a string or b) an OpenAI-style multimodal list of content items
+     Example:
+         a) "Hello", or
+         b) [
+             {"type": "text", "text": "Hello"},
+             {"type": "image_url", "image_url": {
+                 "url": "data:image/jpeg;base64,..."
+             }}
+         ]
+
+     Args:
+         message: The message to check.
+         role: The role of the message.
+         idx: Line number in the file.
+
+     Returns:
+         tuple[bool, int]: A tuple with message is multimodal and the number of images in the message content.
+     """
+     # Text-only message content
+     if isinstance(message_content, str):
+         return False, 0
+
+     # Multimodal message content
+     if isinstance(message_content, list):
+         num_images = 0
+         for item in message_content:
+             if not isinstance(item, dict):
+                 raise InvalidFileFormatError(
+                     "The dataset is malformed, the `content` field must be a list of dicts.",
+                     line_number=idx + 1,
+                     error_source="key_value",
+                 )
+             if "type" not in item:
+                 raise InvalidFileFormatError(
+                     "The dataset is malformed, the `content` field must be a list of dicts with a `type` field.",
+                     line_number=idx + 1,
+                     error_source="key_value",
+                 )
+
+             if item["type"] == "text":
+                 if "text" not in item or not isinstance(item["text"], str):
+                     raise InvalidFileFormatError(
+                         "The dataset is malformed, the `text` field must be present in the `content` item field and be"
+                         f" a string. Got '{item.get('text')!r}' instead.",
+                         line_number=idx + 1,
+                         error_source="key_value",
+                     )
+             elif item["type"] == "image_url":
+                 if role != "user":
+                     raise InvalidFileFormatError(
+                         "The dataset is malformed, only user messages can contain images.",
+                         line_number=idx + 1,
+                         error_source="key_value",
+                     )
+
+                 if "image_url" not in item or not isinstance(item["image_url"], dict):
+                     raise InvalidFileFormatError(
+                         "The dataset is malformed, the `image_url` field must be present in the `content` field and "
+                         f"be a dictionary. Got {item.get('image_url')!r} instead.",
+                         line_number=idx + 1,
+                         error_source="key_value",
+                     )
+
+                 image_data = item["image_url"].get("url")
+                 if not image_data or not isinstance(image_data, str):
+                     raise InvalidFileFormatError(
+                         "The dataset is malformed, the `url` field must be present in the `image_url` field and be "
+                         f"a string. Got {image_data!r} instead.",
+                         line_number=idx + 1,
+                         error_source="key_value",
+                     )
+
+                 if not any(
+                     image_data.startswith(f"data:image/{fmt};base64,")
+                     for fmt in ["jpeg", "png", "webp"]
+                 ):
+                     raise InvalidFileFormatError(
+                         "The dataset is malformed, the `url` field must be either a JPEG, PNG or WEBP base64-encoded "
+                         "image in 'data:image/<format>;base64,<base64_encoded_image>' format. "
+                         f"Got '{image_data[:100]}...' instead.",
+                         line_number=idx + 1,
+                     )
+
+                 if len(image_data) > MAX_BASE64_IMAGE_LENGTH:
+                     raise InvalidFileFormatError(
+                         "The dataset is malformed, the `url` field must contain base64-encoded image "
+                         f"that is less than 10MB, found ~{len(image_data) * 3 // 4} bytes.",
+                         line_number=idx + 1,
+                         error_source="key_value",
+                     )
+
+                 num_images += 1
+             else:
+                 raise InvalidFileFormatError(
+                     "The dataset is malformed, the `type` field must be either 'text' or 'image_url'. "
+                     f"Got {item['type']!r}.",
+                     line_number=idx + 1,
+                     error_source="key_value",
+                 )
+
+         if num_images > MAX_IMAGES_PER_EXAMPLE:
+             raise InvalidFileFormatError(
+                 f"The dataset is malformed, the `content` field must contain at most "
+                 f"{MAX_IMAGES_PER_EXAMPLE} images, found {num_images}.",
+                 line_number=idx + 1,
+                 error_source="key_value",
+             )
+
+         # We still consider text-only messages in such format as multimodal, even if they don't have any images
+         # included - so we can process datasets with rather sparse images (i.e. not in each sample) consistently.
+         return True, num_images
+
+     raise InvalidFileFormatError(
+         f"Invalid content type on line {idx + 1} of the input file. Expected string or multimodal list of dicts, "
+         f"found {type(message_content)}",
+         line_number=idx + 1,
+         error_source="key_value",
+     )
+
+
  def validate_messages(
-     messages: List[Dict[str, str | bool]], idx: int, require_assistant_role: bool = True
+     messages: List[Dict[str, str | int | MessageContent]],
+     idx: int,
+     require_assistant_role: bool = True,
  ) -> None:
      """Validate the messages column.

@@ -249,15 +396,45 @@ def validate_messages(
      """
      _check_conversation_type(messages, idx)

-     has_weights = any("weight" in message for message in messages)
      previous_role = None
      assistant_role_exists = False

+     messages_are_multimodal: bool | None = None
+     total_number_of_images = 0
+
      for message in messages:
-         if has_weights:
-             _check_message_weight(message, idx)
+         message_weight = _check_message_weight(message, idx)
          previous_role = _check_message_role(message, previous_role, idx)
          assistant_role_exists |= previous_role == "assistant"
+         is_multimodal, number_of_images = _check_message_content(
+             message["content"], role=previous_role, idx=idx
+         )
+         # Multimodal validation
+         if number_of_images > 0 and message_weight is not None and message_weight != 0:
+             raise InvalidFileFormatError(
+                 "Messages with images cannot have non-zero weights.",
+                 line_number=idx + 1,
+                 error_source="key_value",
+             )
+         if messages_are_multimodal is None:
+             # Detect the format of the messages in the conversation.
+             messages_are_multimodal = is_multimodal
+         elif messages_are_multimodal != is_multimodal:
+             # Due to the format limitation, we cannot mix multimodal and text only messages in the same sample.
+             raise InvalidFileFormatError(
+                 "Messages in the conversation must be either all in multimodal or all in text-only format.",
+                 line_number=idx + 1,
+                 error_source="key_value",
+             )
+         total_number_of_images += number_of_images
+
+     if total_number_of_images > MAX_IMAGES_PER_EXAMPLE:
+         raise InvalidFileFormatError(
+             f"The dataset is malformed, the `messages` must contain at most {MAX_IMAGES_PER_EXAMPLE} images. "
+             f"Found {total_number_of_images} images.",
+             line_number=idx + 1,
+             error_source="key_value",
+         )

      _check_conversation_roles(require_assistant_role, assistant_role_exists, idx)

@@ -347,12 +524,7 @@ def validate_preference_openai(example: Dict[str, Any], idx: int = 0) -> None:
              error_source="key_value",
          )

-     if not isinstance(example[key][0]["content"], str):
-         raise InvalidFileFormatError(
-             message=f"The dataset is malformed, the 'content' field in `{key}` must be a string on line {idx + 1}.",
-             line_number=idx + 1,
-             error_source="key_value",
-         )
+     _check_message_content(example[key][0]["content"], role="assistant", idx=idx)


  def _check_utf8(file: Path) -> Dict[str, Any]:
@@ -454,8 +626,7 @@ def _check_csv(file: Path, purpose: FilePurpose | str) -> Dict[str, Any]:
          report_dict["load_csv"] = False
          if idx < 0:
              report_dict["message"] = (
-                 "Unable to decode file. "
-                 "File may be empty or in an unsupported format. "
+                 "Unable to decode file. File may be empty or in an unsupported format. "
              )
          else:
              report_dict["message"] = (
@@ -542,13 +713,10 @@ def _check_jsonl(file: Path, purpose: FilePurpose | str) -> Dict[str, Any]:
                          )
                      else:
                          for column in JSONL_REQUIRED_COLUMNS_MAP[current_format]:
-                             if not isinstance(json_line[column], str):
-                                 raise InvalidFileFormatError(
-                                     message=f'Invalid value type for "{column}" key on line {idx + 1}. '
-                                     f"Expected string. Found {type(json_line[column])}.",
-                                     line_number=idx + 1,
-                                     error_source="key_value",
-                                 )
+                             role = "assistant" if column in {"completion"} else "user"
+                             _check_message_content(
+                                 json_line[column], role=role, idx=idx
+                             )

                  if dataset_format is None:
                      dataset_format = current_format
@@ -578,8 +746,7 @@ def _check_jsonl(file: Path, purpose: FilePurpose | str) -> Dict[str, Any]:
          report_dict["load_json"] = False
          if idx < 0:
              report_dict["message"] = (
-                 "Unable to decode file. "
-                 "File may be empty or in an unsupported format. "
+                 "Unable to decode file. File may be empty or in an unsupported format. "
              )
          else:
              report_dict["message"] = (
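Note: the net effect of these validator changes is that message content may now be an OpenAI-style multimodal list. A conversation must be all-text or all-multimodal, images are allowed only in user messages, must be JPEG/PNG/WEBP base64 data URLs under 10MB, at most 10 per example, and image-bearing messages may only carry a weight of 0 (or omit it). A hedged sketch of a sample that passes validate_messages (the base64 payload is truncated; the checks only inspect its prefix and length):

    from together.utils.files import validate_messages

    messages = [
        {
            "role": "user",
            "content": [
                {"type": "text", "text": "What is in this picture?"},
                {
                    "type": "image_url",
                    "image_url": {"url": "data:image/png;base64,iVBORw0KGgo..."},
                },
            ],
        },
        {
            "role": "assistant",
            # Must also use the list form: one sample cannot mix
            # multimodal and plain-string message content
            "content": [{"type": "text", "text": "A cat sitting on a sofa."}],
        },
    ]

    validate_messages(messages, idx=0)  # raises InvalidFileFormatError if malformed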