gllm-inference-binary 0.5.9__cp312-cp312-win_amd64.whl → 0.5.9b1__cp312-cp312-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- gllm_inference/builder/build_em_invoker.pyi +17 -2
- gllm_inference/builder/build_lm_invoker.pyi +13 -2
- gllm_inference/constants.pyi +2 -2
- gllm_inference/em_invoker/__init__.pyi +2 -1
- gllm_inference/em_invoker/azure_openai_em_invoker.pyi +7 -5
- gllm_inference/em_invoker/bedrock_em_invoker.pyi +106 -0
- gllm_inference/em_invoker/em_invoker.pyi +11 -4
- gllm_inference/em_invoker/google_em_invoker.pyi +8 -3
- gllm_inference/em_invoker/langchain/em_invoker_embeddings.pyi +25 -3
- gllm_inference/em_invoker/langchain_em_invoker.pyi +7 -2
- gllm_inference/em_invoker/openai_compatible_em_invoker.pyi +6 -2
- gllm_inference/em_invoker/openai_em_invoker.pyi +5 -1
- gllm_inference/em_invoker/schema/bedrock.pyi +22 -0
- gllm_inference/em_invoker/schema/google.pyi +2 -0
- gllm_inference/em_invoker/schema/langchain.pyi +1 -0
- gllm_inference/em_invoker/twelevelabs_em_invoker.pyi +5 -3
- gllm_inference/em_invoker/voyage_em_invoker.pyi +5 -2
- gllm_inference/exceptions/__init__.pyi +3 -3
- gllm_inference/exceptions/error_parser.pyi +26 -33
- gllm_inference/exceptions/exceptions.pyi +40 -28
- gllm_inference/exceptions/provider_error_map.pyi +23 -0
- gllm_inference/lm_invoker/__init__.pyi +2 -1
- gllm_inference/lm_invoker/azure_openai_lm_invoker.pyi +12 -13
- gllm_inference/lm_invoker/bedrock_lm_invoker.pyi +2 -0
- gllm_inference/lm_invoker/google_lm_invoker.pyi +8 -1
- gllm_inference/lm_invoker/langchain_lm_invoker.pyi +2 -0
- gllm_inference/lm_invoker/lm_invoker.pyi +7 -6
- gllm_inference/lm_invoker/openai_compatible_lm_invoker.pyi +1 -1
- gllm_inference/lm_invoker/openai_lm_invoker.pyi +7 -6
- gllm_inference/lm_invoker/schema/bedrock.pyi +5 -0
- gllm_inference/lm_invoker/schema/langchain.pyi +1 -0
- gllm_inference/lm_invoker/schema/openai.pyi +1 -0
- gllm_inference/lm_invoker/schema/openai_compatible.pyi +4 -0
- gllm_inference/lm_invoker/schema/xai.pyi +31 -0
- gllm_inference/lm_invoker/xai_lm_invoker.pyi +305 -0
- gllm_inference/request_processor/lm_request_processor.pyi +12 -3
- gllm_inference/request_processor/uses_lm_mixin.pyi +109 -29
- gllm_inference/schema/__init__.pyi +5 -4
- gllm_inference/schema/config.pyi +15 -0
- gllm_inference/schema/enums.pyi +5 -0
- gllm_inference/schema/model_id.pyi +10 -1
- gllm_inference/schema/token_usage.pyi +66 -2
- gllm_inference/schema/type_alias.pyi +1 -5
- gllm_inference/utils/__init__.pyi +2 -1
- gllm_inference/utils/io_utils.pyi +26 -0
- gllm_inference.cp312-win_amd64.pyd +0 -0
- gllm_inference.pyi +25 -12
- {gllm_inference_binary-0.5.9.dist-info → gllm_inference_binary-0.5.9b1.dist-info}/METADATA +71 -108
- {gllm_inference_binary-0.5.9.dist-info → gllm_inference_binary-0.5.9b1.dist-info}/RECORD +51 -43
- {gllm_inference_binary-0.5.9.dist-info → gllm_inference_binary-0.5.9b1.dist-info}/WHEEL +2 -1
- gllm_inference_binary-0.5.9b1.dist-info/top_level.txt +1 -0
gllm_inference/builder/build_em_invoker.pyi CHANGED
@@ -1,5 +1,5 @@
 from _typeshed import Incomplete
-from gllm_inference.em_invoker import AzureOpenAIEMInvoker as AzureOpenAIEMInvoker, GoogleEMInvoker as GoogleEMInvoker, LangChainEMInvoker as LangChainEMInvoker, OpenAICompatibleEMInvoker as OpenAICompatibleEMInvoker, OpenAIEMInvoker as OpenAIEMInvoker, TwelveLabsEMInvoker as TwelveLabsEMInvoker, VoyageEMInvoker as VoyageEMInvoker
+from gllm_inference.em_invoker import AzureOpenAIEMInvoker as AzureOpenAIEMInvoker, BedrockEMInvoker as BedrockEMInvoker, GoogleEMInvoker as GoogleEMInvoker, LangChainEMInvoker as LangChainEMInvoker, OpenAICompatibleEMInvoker as OpenAICompatibleEMInvoker, OpenAIEMInvoker as OpenAIEMInvoker, TwelveLabsEMInvoker as TwelveLabsEMInvoker, VoyageEMInvoker as VoyageEMInvoker
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
 from gllm_inference.schema.model_id import ModelId as ModelId, ModelProvider as ModelProvider
 from typing import Any
@@ -9,6 +9,7 @@ logger: Incomplete
 
 class Key:
     """Defines valid keys in the config."""
+    ACCESS_KEY_ID: str
     API_KEY: str
     AZURE_DEPLOYMENT: str
     AZURE_ENDPOINT: str
@@ -17,6 +18,7 @@ class Key:
     MODEL_KWARGS: str
     MODEL_NAME: str
     MODEL_CLASS_PATH: str
+    SECRET_ACCESS_KEY: str
 
 def build_em_invoker(model_id: str | ModelId, credentials: str | dict[str, Any] | None = None, config: dict[str, Any] | None = None) -> BaseEMInvoker:
     '''Build an embedding model invoker based on the provided configurations.
@@ -41,6 +43,19 @@ def build_em_invoker(model_id: str | ModelId, credentials: str | dict[str, Any]
         ValueError: If the provider is invalid.
 
     Usage examples:
+    # Using Bedrock
+    ```python
+    em_invoker = build_em_invoker(
+        model_id="bedrock/cohere.embed-english-v3",
+        credentials={
+            "access_key_id": "Abc123...",
+            "secret_access_key": "Xyz123...",
+        },
+    )
+    ```
+    The credentials can also be provided through the `AWS_ACCESS_KEY_ID` and `AWS_SECRET_ACCESS_KEY`
+    environment variables.
+
     # Using Google Gen AI (via API key)
     ```python
     em_invoker = build_em_invoker(
@@ -71,7 +86,7 @@ def build_em_invoker(model_id: str | ModelId, credentials: str | dict[str, Any]
     # Using Azure OpenAI
     ```python
     em_invoker = build_em_invoker(
-        model_id="azure-openai/https://my-resource.openai.azure.com:my-deployment",
+        model_id="azure-openai/https://my-resource.openai.azure.com/openai/v1:my-deployment",
         credentials="azure-api-key"
     )
     ```

gllm_inference/builder/build_lm_invoker.pyi CHANGED
@@ -1,5 +1,5 @@
 from _typeshed import Incomplete
-from gllm_inference.lm_invoker import AnthropicLMInvoker as AnthropicLMInvoker, AzureOpenAILMInvoker as AzureOpenAILMInvoker, BedrockLMInvoker as BedrockLMInvoker, DatasaurLMInvoker as DatasaurLMInvoker, GoogleLMInvoker as GoogleLMInvoker, LangChainLMInvoker as LangChainLMInvoker, LiteLLMLMInvoker as LiteLLMLMInvoker, OpenAICompatibleLMInvoker as OpenAICompatibleLMInvoker, OpenAILMInvoker as OpenAILMInvoker
+from gllm_inference.lm_invoker import AnthropicLMInvoker as AnthropicLMInvoker, AzureOpenAILMInvoker as AzureOpenAILMInvoker, BedrockLMInvoker as BedrockLMInvoker, DatasaurLMInvoker as DatasaurLMInvoker, GoogleLMInvoker as GoogleLMInvoker, LangChainLMInvoker as LangChainLMInvoker, LiteLLMLMInvoker as LiteLLMLMInvoker, OpenAICompatibleLMInvoker as OpenAICompatibleLMInvoker, OpenAILMInvoker as OpenAILMInvoker, XAILMInvoker as XAILMInvoker
 from gllm_inference.lm_invoker.lm_invoker import BaseLMInvoker as BaseLMInvoker
 from gllm_inference.schema.model_id import ModelId as ModelId, ModelProvider as ModelProvider
 from typing import Any
@@ -107,7 +107,7 @@ def build_lm_invoker(model_id: str | ModelId, credentials: str | dict[str, Any]
     # Using Azure OpenAI
     ```python
     lm_invoker = build_lm_invoker(
-        model_id="azure-openai/https://my-resource.openai.azure.com:my-deployment",
+        model_id="azure-openai/https://my-resource.openai.azure.com/openai/v1:my-deployment",
         credentials="azure-api-key"
     )
     ```
@@ -144,6 +144,17 @@ def build_lm_invoker(model_id: str | ModelId, credentials: str | dict[str, Any]
     For the list of supported providers, please refer to the following page:
     https://docs.litellm.ai/docs/providers/
 
+    # Using xAI
+    ```python
+    lm_invoker = build_lm_invoker(
+        model_id="xai/grok-3",
+        credentials="xai-..."
+    )
+    ```
+    The credentials can also be provided through the `XAI_API_KEY` environment variable.
+    For the list of supported models, please refer to the following page:
+    https://docs.x.ai/docs/models
+
     Security warning:
         Please provide the LM invoker credentials ONLY to the `credentials` parameter. Do not put any kind of
         credentials in the `config` parameter as the content of the `config` parameter will be logged.

gllm_inference/constants.pyi CHANGED
@@ -1,10 +1,10 @@
 from _typeshed import Incomplete
 
-
+AZURE_OPENAI_URL_SUFFIX: str
 DOCUMENT_MIME_TYPES: Incomplete
 GOOGLE_SCOPES: Incomplete
+GRPC_ENABLE_RETRIES_KEY: str
 INVOKER_PROPAGATED_MAX_RETRIES: int
 INVOKER_DEFAULT_TIMEOUT: float
 HEX_REPR_LENGTH: int
-HTTP_STATUS_CODE_PATTERNS: Incomplete
 SECONDS_TO_MILLISECONDS: int

gllm_inference/em_invoker/__init__.pyi CHANGED
@@ -1,4 +1,5 @@
 from gllm_inference.em_invoker.azure_openai_em_invoker import AzureOpenAIEMInvoker as AzureOpenAIEMInvoker
+from gllm_inference.em_invoker.bedrock_em_invoker import BedrockEMInvoker as BedrockEMInvoker
 from gllm_inference.em_invoker.google_em_invoker import GoogleEMInvoker as GoogleEMInvoker
 from gllm_inference.em_invoker.langchain_em_invoker import LangChainEMInvoker as LangChainEMInvoker
 from gllm_inference.em_invoker.openai_compatible_em_invoker import OpenAICompatibleEMInvoker as OpenAICompatibleEMInvoker
@@ -6,4 +7,4 @@ from gllm_inference.em_invoker.openai_em_invoker import OpenAIEMInvoker as OpenA
 from gllm_inference.em_invoker.twelevelabs_em_invoker import TwelveLabsEMInvoker as TwelveLabsEMInvoker
 from gllm_inference.em_invoker.voyage_em_invoker import VoyageEMInvoker as VoyageEMInvoker
 
-__all__ = ['AzureOpenAIEMInvoker', 'GoogleEMInvoker', 'LangChainEMInvoker', 'OpenAIEMInvoker', 'OpenAICompatibleEMInvoker', 'TwelveLabsEMInvoker', 'VoyageEMInvoker']
+__all__ = ['AzureOpenAIEMInvoker', 'BedrockEMInvoker', 'GoogleEMInvoker', 'LangChainEMInvoker', 'OpenAIEMInvoker', 'OpenAICompatibleEMInvoker', 'TwelveLabsEMInvoker', 'VoyageEMInvoker']

gllm_inference/em_invoker/azure_openai_em_invoker.pyi CHANGED
@@ -1,9 +1,9 @@
 from _typeshed import Incomplete
 from gllm_core.utils.retry import RetryConfig as RetryConfig
-from gllm_inference.constants import
+from gllm_inference.constants import AZURE_OPENAI_URL_SUFFIX as AZURE_OPENAI_URL_SUFFIX, INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.em_invoker.openai_em_invoker import OpenAIEMInvoker as OpenAIEMInvoker
 from gllm_inference.em_invoker.schema.openai import Key as Key
-from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider
+from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig
 from typing import Any
 
 class AzureOpenAIEMInvoker(OpenAIEMInvoker):
@@ -16,6 +16,7 @@ class AzureOpenAIEMInvoker(OpenAIEMInvoker):
         client (AsyncAzureOpenAI): The client for the Azure OpenAI API.
         default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
         retry_config (RetryConfig): The retry configuration for the embedding model.
+        truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
 
     Input types:
         The `AzureOpenAIEMInvoker` only supports text inputs.
@@ -68,7 +69,7 @@ class AzureOpenAIEMInvoker(OpenAIEMInvoker):
     ```
     '''
     client: Incomplete
-    def __init__(self, azure_endpoint: str, azure_deployment: str, api_key: str | None = None, api_version: str =
+    def __init__(self, azure_endpoint: str, azure_deployment: str, api_key: str | None = None, api_version: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
         """Initializes a new instance of the AzureOpenAIEMInvoker class.
 
         Args:
@@ -76,11 +77,12 @@ class AzureOpenAIEMInvoker(OpenAIEMInvoker):
             azure_deployment (str): The deployment name of the Azure OpenAI service.
             api_key (str | None, optional): The API key for authenticating with Azure OpenAI. Defaults to None, in
                 which case the `AZURE_OPENAI_API_KEY` environment variable will be used.
-            api_version (str, optional):
-                `DEFAULT_AZURE_OPENAI_API_VERSION`.
+            api_version (str | None, optional): Deprecated parameter to be removed in v0.6. Defaults to None.
             model_kwargs (dict[str, Any] | None, optional): Additional model parameters. Defaults to None.
             default_hyperparameters (dict[str, Any] | None, optional): Default hyperparameters for invoking the model.
                 Defaults to None.
             retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
                 Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+            truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
+                Defaults to None, in which case no truncation is applied.
         """
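The user-visible change in this file is the endpoint format: `azure_endpoint` now carries the `/openai/v1` suffix (see the new `AZURE_OPENAI_URL_SUFFIX` constant), and `api_version` is deprecated. A hedged sketch of the updated constructor call, with values adapted from the docstring example above:

```python
from gllm_inference.em_invoker import AzureOpenAIEMInvoker

em_invoker = AzureOpenAIEMInvoker(
    azure_endpoint="https://my-resource.openai.azure.com/openai/v1",  # note the new suffix
    azure_deployment="my-deployment",
    api_key="azure-api-key",  # or rely on the AZURE_OPENAI_API_KEY environment variable
    # `api_version` is deprecated and slated for removal in v0.6, so it is omitted here.
)
```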

gllm_inference/em_invoker/bedrock_em_invoker.pyi ADDED
@@ -0,0 +1,106 @@
+from _typeshed import Incomplete
+from enum import StrEnum
+from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
+from gllm_inference.em_invoker.schema.bedrock import InputType as InputType, Key as Key, OutputType as OutputType
+from gllm_inference.exceptions import BaseInvokerError as BaseInvokerError, convert_http_status_to_base_invoker_error as convert_http_status_to_base_invoker_error
+from gllm_inference.exceptions.provider_error_map import BEDROCK_ERROR_MAPPING as BEDROCK_ERROR_MAPPING
+from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig, Vector as Vector
+from typing import Any
+
+class ModelType(StrEnum):
+    """Defines the type of the Bedrock embedding model."""
+    COHERE = 'cohere'
+    TITAN = 'titan'
+
+SUPPORTED_ATTACHMENTS: Incomplete
+
+class BedrockEMInvoker(BaseEMInvoker):
+    '''An embedding model invoker to interact with AWS Bedrock embedding models.
+
+    Attributes:
+        model_id (str): The model ID of the embedding model.
+        model_provider (str): The provider of the embedding model.
+        model_name (str): The name of the embedding model.
+        session (Session): The Bedrock client session.
+        client_kwargs (dict[str, Any]): The Bedrock client kwargs.
+        default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
+        retry_config (RetryConfig): The retry configuration for the embedding model.
+        truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
+
+    Input types:
+        The `BedrockEMInvoker` only supports text inputs.
+
+    Output format:
+        The `BedrockEMInvoker` can embed either:
+        1. A single content.
+           1. A single content is a single text.
+           2. The output will be a `Vector`, representing the embedding of the content.
+
+           # Example 1: Embedding a text content.
+           ```python
+           text = "This is a text"
+           result = await em_invoker.invoke(text)
+           ```
+
+           The above examples will return a `Vector` with a size of (embedding_size,).
+
+        2. A list of contents.
+           1. A list of contents is a list of texts.
+           2. The output will be a `list[Vector]`, where each element is a `Vector` representing the
+              embedding of each single content.
+
+           # Example: Embedding a list of contents.
+           ```python
+           text1 = "This is a text"
+           text2 = "This is another text"
+           text3 = "This is yet another text"
+           result = await em_invoker.invoke([text1, text2, text3])
+           ```
+
+           The above examples will return a `list[Vector]` with a size of (3, embedding_size).
+
+    Retry and timeout:
+        The `BedrockEMInvoker` supports retry and timeout configuration.
+        By default, the max retries is set to 0 and the timeout is set to 30.0 seconds.
+        They can be customized by providing a custom `RetryConfig` object to the `retry_config` parameter.
+
+        Retry config examples:
+        ```python
+        retry_config = RetryConfig(max_retries=0, timeout=0.0)  # No retry, no timeout
+        retry_config = RetryConfig(max_retries=0, timeout=10.0)  # No retry, 10.0 seconds timeout
+        retry_config = RetryConfig(max_retries=5, timeout=0.0)  # 5 max retries, no timeout
+        retry_config = RetryConfig(max_retries=5, timeout=10.0)  # 5 max retries, 10.0 seconds timeout
+        ```
+
+        Usage example:
+        ```python
+        em_invoker = BedrockEMInvoker(..., retry_config=retry_config)
+        ```
+    '''
+    session: Incomplete
+    client_kwargs: Incomplete
+    def __init__(self, model_name: str, access_key_id: str | None = None, secret_access_key: str | None = None, region_name: str = 'us-east-1', model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
+        '''Initializes a new instance of the BedrockEMInvoker class.
+
+        Args:
+            model_name (str): The name of the Bedrock embedding model to be used.
+            access_key_id (str | None, optional): The AWS access key ID. Defaults to None, in which case
+                the `AWS_ACCESS_KEY_ID` environment variable will be used.
+            secret_access_key (str | None, optional): The AWS secret access key. Defaults to None, in which case
+                the `AWS_SECRET_ACCESS_KEY` environment variable will be used.
+            region_name (str, optional): The AWS region name. Defaults to "us-east-1".
+            model_kwargs (dict[str, Any] | None, optional): Additional keyword arguments for the Bedrock client.
+                Defaults to None.
+            default_hyperparameters (dict[str, Any] | None, optional): Default hyperparameters for invoking the model.
+                Defaults to None.
+            retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
+                Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+            truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
+                Defaults to None, in which case no truncation is applied.
+
+        Raises:
+            ValueError: If the model name is not supported.
+            ValueError: If `access_key_id` or `secret_access_key` is neither provided nor set in the
+                `AWS_ACCESS_KEY_ID` or `AWS_SECRET_ACCESS_KEY` environment variables, respectively.
+        '''
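Putting the new stub together, a sketch of direct `BedrockEMInvoker` usage based on the signature and docstring above; the model name is illustrative and `invoke` is awaited per the docstring examples:

```python
import asyncio

from gllm_inference.em_invoker import BedrockEMInvoker

em_invoker = BedrockEMInvoker(
    model_name="cohere.embed-english-v3",  # illustrative; must be a supported model
    access_key_id="Abc123...",             # or the AWS_ACCESS_KEY_ID environment variable
    secret_access_key="Xyz123...",         # or the AWS_SECRET_ACCESS_KEY environment variable
    region_name="us-east-1",
)

# Embed one text and a batch, per the "Output format" docstring.
single = asyncio.run(em_invoker.invoke("This is a text"))           # -> Vector
batch = asyncio.run(em_invoker.invoke(["first text", "second"]))    # -> list[Vector]
```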

gllm_inference/em_invoker/em_invoker.pyi CHANGED
@@ -3,8 +3,8 @@ from _typeshed import Incomplete
 from abc import ABC
 from gllm_core.utils.retry import RetryConfig
 from gllm_inference.constants import DOCUMENT_MIME_TYPES as DOCUMENT_MIME_TYPES, INVOKER_DEFAULT_TIMEOUT as INVOKER_DEFAULT_TIMEOUT
-from gllm_inference.exceptions import
-from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, Vector as Vector
+from gllm_inference.exceptions import BaseInvokerError as BaseInvokerError, convert_to_base_invoker_error as convert_to_base_invoker_error
+from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, TruncateSide as TruncateSide, TruncationConfig as TruncationConfig, Vector as Vector
 from typing import Any
 
 class BaseEMInvoker(ABC, metaclass=abc.ABCMeta):
@@ -16,12 +16,17 @@ class BaseEMInvoker(ABC, metaclass=abc.ABCMeta):
         model_id (str): The model ID of the embedding model.
         model_provider (str): The provider of the embedding model.
         model_name (str): The name of the embedding model.
-        default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the
+        default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the
+            embedding model. Defaults to None, in which case an empty dictionary is used.
         retry_config (RetryConfig): The retry configuration for the embedding model.
+            Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+        truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
+            Defaults to None, in which case no truncation is applied.
     """
     default_hyperparameters: Incomplete
     retry_config: Incomplete
-
+    truncation_config: Incomplete
+    def __init__(self, model_id: ModelId, default_hyperparameters: dict[str, Any] | None = None, supported_attachments: set[str] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
         """Initializes a new instance of the BaseEMInvoker class.
 
         Args:
@@ -32,6 +37,8 @@ class BaseEMInvoker(ABC, metaclass=abc.ABCMeta):
                 in which case an empty set is used (indicating that no attachments are supported).
             retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
                 Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+            truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
+                Defaults to None, in which case no truncation is applied.
         """
     @property
     def model_id(self) -> str:

gllm_inference/em_invoker/google_em_invoker.pyi CHANGED
@@ -3,7 +3,9 @@ from gllm_core.utils.retry import RetryConfig as RetryConfig
 from gllm_inference.constants import GOOGLE_SCOPES as GOOGLE_SCOPES, SECONDS_TO_MILLISECONDS as SECONDS_TO_MILLISECONDS
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
 from gllm_inference.em_invoker.schema.google import Key as Key
-from gllm_inference.
+from gllm_inference.exceptions import BaseInvokerError as BaseInvokerError, convert_http_status_to_base_invoker_error as convert_http_status_to_base_invoker_error
+from gllm_inference.exceptions.provider_error_map import GOOGLE_ERROR_MAPPING as GOOGLE_ERROR_MAPPING
+from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig, Vector as Vector
 from typing import Any
 
 SUPPORTED_ATTACHMENTS: Incomplete
@@ -17,7 +19,8 @@ class GoogleEMInvoker(BaseEMInvoker):
         model_name (str): The name of the embedding model.
         client_params (dict[str, Any]): The Google client instance init parameters.
         default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
-        retry_config (RetryConfig
+        retry_config (RetryConfig): The retry configuration for the embedding model.
+        truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
 
     Initialization:
         The `GoogleEMInvoker` can use either Google Gen AI or Google Vertex AI.
@@ -98,7 +101,7 @@ class GoogleEMInvoker(BaseEMInvoker):
     ```
     '''
     client_params: Incomplete
-    def __init__(self, model_name: str, api_key: str | None = None, credentials_path: str | None = None, project_id: str | None = None, location: str = 'us-central1', model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None) -> None:
+    def __init__(self, model_name: str, api_key: str | None = None, credentials_path: str | None = None, project_id: str | None = None, location: str = 'us-central1', model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
         '''Initializes a new instance of the GoogleEMInvoker class.
 
         Args:
@@ -117,6 +120,8 @@ class GoogleEMInvoker(BaseEMInvoker):
                 Defaults to None.
             retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
                 Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+            truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
+                Defaults to None, in which case no truncation is applied.
 
         Note:
             If neither `api_key` nor `credentials_path` is provided, Google Gen AI will be used by default.

gllm_inference/em_invoker/langchain/em_invoker_embeddings.pyi CHANGED
@@ -1,14 +1,23 @@
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
-from gllm_inference.schema import Vector as Vector
+from gllm_inference.schema import Attachment as Attachment, Vector as Vector
+from gllm_inference.utils.io_utils import DEFAULT_BASE64_ALLOWED_MIMETYPES as DEFAULT_BASE64_ALLOWED_MIMETYPES, base64_to_bytes as base64_to_bytes
 from langchain_core.embeddings import Embeddings
 from pydantic import BaseModel
 from typing import Any
 
 class EMInvokerEmbeddings(BaseModel, Embeddings, arbitrary_types_allowed=True):
-
+    '''An adapter class that enables an `EMInvoker` to be used as a LangChain `Embeddings`.
 
     Attributes:
         em_invoker (BaseEMInvoker): The `EMInvoker` instance to be interacted with.
+        use_base64 (bool):
+            Whether to apply strict base64 encoding to the input.
+            1. If `True`, only inputs with specific MIME types (e.g. images,
+               audio, and video) will be converted into base64 strings before being sent.
+            2. If `False`, each input is treated as a raw string.
+
+            This ensures "strict" handling: base64 encoding is not applied
+            universally, but only when required for those MIME types.
 
     Usage example:
     ```python
@@ -18,8 +27,9 @@ class EMInvokerEmbeddings(BaseModel, Embeddings, arbitrary_types_allowed=True):
     em_invoker = OpenAIEMInvoker(...)
     embeddings = EMInvokerEmbeddings(em_invoker=em_invoker)
     ```
-
+    '''
     em_invoker: BaseEMInvoker
+    use_base64: bool
     async def aembed_documents(self, texts: list[str], **kwargs: Any) -> list[Vector]:
         """Asynchronously embed documents using the `EMInvoker`.
@@ -29,6 +39,9 @@ class EMInvokerEmbeddings(BaseModel, Embeddings, arbitrary_types_allowed=True):
 
         Returns:
             list[Vector]: List of embeddings, one for each text.
+
+        Raises:
+            ValueError: If `texts` is not a list of strings.
         """
     async def aembed_query(self, text: str, **kwargs: Any) -> Vector:
         """Asynchronously embed query using the `EMInvoker`.
@@ -39,6 +52,9 @@ class EMInvokerEmbeddings(BaseModel, Embeddings, arbitrary_types_allowed=True):
 
         Returns:
             Vector: Embeddings for the text.
+
+        Raises:
+            ValueError: If `text` is not a string.
         """
     def embed_documents(self, texts: list[str], **kwargs: Any) -> list[Vector]:
         """Embed documents using the `EMInvoker`.
@@ -49,6 +65,9 @@ class EMInvokerEmbeddings(BaseModel, Embeddings, arbitrary_types_allowed=True):
 
         Returns:
             list[Vector]: List of embeddings, one for each text.
+
+        Raises:
+            ValueError: If `texts` is not a list of strings.
         """
     def embed_query(self, text: str, **kwargs: Any) -> Vector:
         """Embed query using the `EMInvoker`.
@@ -59,4 +78,7 @@ class EMInvokerEmbeddings(BaseModel, Embeddings, arbitrary_types_allowed=True):
 
         Returns:
             Vector: Embeddings for the text.
+
+        Raises:
+            ValueError: If `text` is not a string.
         """
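The adapter now exposes `use_base64` alongside `em_invoker`. A sketch of the LangChain-facing surface based on the stub above; `use_base64` is passed explicitly since the stub declares it without a visible default, and the OpenAI model name is illustrative:

```python
from gllm_inference.em_invoker import OpenAIEMInvoker
from gllm_inference.em_invoker.langchain.em_invoker_embeddings import EMInvokerEmbeddings

em_invoker = OpenAIEMInvoker(model_name="text-embedding-3-small", api_key="sk-...")
embeddings = EMInvokerEmbeddings(em_invoker=em_invoker, use_base64=False)

# Standard LangChain Embeddings methods, delegated to the EMInvoker.
query_vector = embeddings.embed_query("What is retrieval-augmented generation?")
doc_vectors = embeddings.embed_documents(["first document", "second document"])
```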

gllm_inference/em_invoker/langchain_em_invoker.pyi CHANGED
@@ -3,7 +3,9 @@ from gllm_core.utils.retry import RetryConfig
 from gllm_inference.constants import INVOKER_DEFAULT_TIMEOUT as INVOKER_DEFAULT_TIMEOUT, INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
 from gllm_inference.em_invoker.schema.langchain import Key as Key
-from gllm_inference.
+from gllm_inference.exceptions import BaseInvokerError as BaseInvokerError, InvokerRuntimeError as InvokerRuntimeError, build_debug_info as build_debug_info
+from gllm_inference.exceptions.provider_error_map import ALL_PROVIDER_ERROR_MAPPINGS as ALL_PROVIDER_ERROR_MAPPINGS, LANGCHAIN_ERROR_CODE_MAPPING as LANGCHAIN_ERROR_CODE_MAPPING
+from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig, Vector as Vector
 from gllm_inference.utils import load_langchain_model as load_langchain_model, parse_model_data as parse_model_data
 from langchain_core.embeddings import Embeddings as Embeddings
 from typing import Any
@@ -19,9 +21,10 @@ class LangChainEMInvoker(BaseEMInvoker):
         model_name (str): The name of the embedding model.
         em (Embeddings): The instance to interact with an embedding model defined using LangChain's Embeddings.
         retry_config (RetryConfig): The retry configuration for the embedding model.
+        truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
     """
     model: Incomplete
-    def __init__(self, model: Embeddings | None = None, model_class_path: str | None = None, model_name: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None) -> None:
+    def __init__(self, model: Embeddings | None = None, model_class_path: str | None = None, model_name: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
         '''Initializes a new instance of the LangChainEMInvoker class.
 
         Args:
@@ -38,4 +41,6 @@ class LangChainEMInvoker(BaseEMInvoker):
                 Defaults to None.
             retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
                 Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+            truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
+                Defaults to None, in which case no truncation is applied.
         '''
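For contrast with the adapter above (EMInvoker wrapped as LangChain `Embeddings`), `LangChainEMInvoker` goes the other way: a LangChain `Embeddings` wrapped as an EMInvoker. A sketch based on the signature above; the `langchain_openai` import and the routing of `model_kwargs` into the class named by `model_class_path` are assumptions:

```python
from gllm_inference.em_invoker import LangChainEMInvoker
from langchain_openai import OpenAIEmbeddings  # any LangChain Embeddings implementation

# Wrap an existing Embeddings instance...
em_invoker = LangChainEMInvoker(model=OpenAIEmbeddings(model="text-embedding-3-small"))

# ...or let the invoker construct one lazily (assumed semantics of
# `model_class_path` + `model_kwargs`).
em_invoker = LangChainEMInvoker(
    model_class_path="langchain_openai.OpenAIEmbeddings",
    model_kwargs={"model": "text-embedding-3-small"},
)
```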

gllm_inference/em_invoker/openai_compatible_em_invoker.pyi CHANGED
@@ -3,7 +3,7 @@ from gllm_core.utils.retry import RetryConfig as RetryConfig
 from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.em_invoker.openai_em_invoker import OpenAIEMInvoker as OpenAIEMInvoker
 from gllm_inference.em_invoker.schema.openai_compatible import Key as Key
-from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider
+from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig
 from typing import Any
 
 class OpenAICompatibleEMInvoker(OpenAIEMInvoker):
@@ -16,6 +16,8 @@ class OpenAICompatibleEMInvoker(OpenAIEMInvoker):
         client (AsyncOpenAI): The OpenAI client instance.
         default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
         retry_config (RetryConfig): The retry configuration for the embedding model.
+        truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
+
 
     When to use:
         The `OpenAICompatibleEMInvoker` is designed to interact with endpoints that are compatible with OpenAI's
@@ -76,7 +78,7 @@ class OpenAICompatibleEMInvoker(OpenAIEMInvoker):
     ```
     '''
     client: Incomplete
-    def __init__(self, model_name: str, base_url: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None) -> None:
+    def __init__(self, model_name: str, base_url: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
         """Initializes a new instance of the OpenAICompatibleEMInvoker class.
 
         Args:
@@ -89,4 +91,6 @@ class OpenAICompatibleEMInvoker(OpenAIEMInvoker):
                 Defaults to None.
             retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
                 Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+            truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
+                Defaults to None, in which case no truncation is applied.
         """

gllm_inference/em_invoker/openai_em_invoker.pyi CHANGED
@@ -4,6 +4,7 @@ from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_P
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
 from gllm_inference.em_invoker.schema.openai import Key as Key
 from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, Vector as Vector
+from gllm_inference.schema.config import TruncationConfig as TruncationConfig
 from typing import Any
 
 SUPPORTED_ATTACHMENTS: Incomplete
@@ -18,6 +19,7 @@ class OpenAIEMInvoker(BaseEMInvoker):
         client (AsyncOpenAI): The client for the OpenAI API.
         default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
         retry_config (RetryConfig): The retry configuration for the embedding model.
+        truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
 
     Input types:
         The `OpenAIEMInvoker` only supports text inputs.
@@ -70,7 +72,7 @@ class OpenAIEMInvoker(BaseEMInvoker):
     ```
     '''
     client: Incomplete
-    def __init__(self, model_name: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None) -> None:
+    def __init__(self, model_name: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
         """Initializes a new instance of the OpenAIEMInvoker class.
 
         Args:
@@ -83,4 +85,6 @@ class OpenAIEMInvoker(BaseEMInvoker):
                 Defaults to None.
             retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
                 Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+            truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
+                Defaults to None, in which case no truncation is applied.
         """

gllm_inference/em_invoker/schema/bedrock.pyi ADDED
@@ -0,0 +1,22 @@
+class Key:
+    """Defines valid keys in Bedrock."""
+    ACCEPT: str
+    CONTENT_TYPE: str
+    HTTP_STATUS_CODE: str
+    INPUT_TEXT: str
+    INPUT_TYPE: str
+    MODEL_ID: str
+    RESPONSE_METADATA: str
+    TEXTS: str
+
+class InputType:
+    """Defines valid input types in Bedrock."""
+    APPLICATION_JSON: str
+    SEARCH_DOCUMENT: str
+    SEARCH_QUERY: str
+
+class OutputType:
+    """Defines valid output types in Bedrock."""
+    BODY: str
+    EMBEDDING: str
+    EMBEDDINGS: str
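The key names above mirror the raw Bedrock request and response fields. A hedged sketch of the payloads they presumably map onto; the concrete JSON field strings are assumptions drawn from AWS Bedrock's public embedding APIs, not from this diff:

```python
import json

# Titan-style request body (Key.INPUT_TEXT presumably -> "inputText").
titan_body = json.dumps({"inputText": "This is a text"})

# Cohere-style request body (Key.TEXTS / Key.INPUT_TYPE presumably ->
# "texts" / "input_type", with InputType.SEARCH_DOCUMENT / SEARCH_QUERY values).
cohere_body = json.dumps({
    "texts": ["This is a text"],
    "input_type": "search_document",  # or "search_query"
})
```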

gllm_inference/em_invoker/twelevelabs_em_invoker.pyi CHANGED
@@ -1,9 +1,8 @@
 from _typeshed import Incomplete
 from gllm_core.utils.retry import RetryConfig as RetryConfig
-from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
 from gllm_inference.em_invoker.schema.twelvelabs import InputType as InputType, Key as Key, OutputType as OutputType
-from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, ModelProvider as ModelProvider, Vector as Vector
+from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig, Vector as Vector
 from typing import Any
 
 SUPPORTED_ATTACHMENTS: Incomplete
@@ -18,6 +17,7 @@ class TwelveLabsEMInvoker(BaseEMInvoker):
         client (Client): The client for the TwelveLabs API.
         default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
         retry_config (RetryConfig): The retry configuration for the embedding model.
+        truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
 
     Input types:
         The `TwelveLabsEMInvoker` supports the following input types: text, audio, and image.
@@ -83,7 +83,7 @@ class TwelveLabsEMInvoker(BaseEMInvoker):
     ```
     '''
    client: Incomplete
-    def __init__(self, model_name: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None) -> None:
+    def __init__(self, model_name: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
         """Initializes a new instance of the TwelveLabsEMInvoker class.
 
         Args:
@@ -96,4 +96,6 @@ class TwelveLabsEMInvoker(BaseEMInvoker):
                 Defaults to None.
             retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
                 Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+            truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
+                Defaults to None, in which case no truncation is applied.
         """

gllm_inference/em_invoker/voyage_em_invoker.pyi CHANGED
@@ -3,7 +3,7 @@ from gllm_core.utils.retry import RetryConfig as RetryConfig
 from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
 from gllm_inference.em_invoker.schema.voyage import InputType as InputType, Key as Key
-from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, ModelProvider as ModelProvider, Vector as Vector
+from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig, Vector as Vector
 from typing import Any
 
 SUPPORTED_ATTACHMENTS: Incomplete
@@ -19,6 +19,7 @@ class VoyageEMInvoker(BaseEMInvoker):
         client (Client): The client for the Voyage API.
         default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
         retry_config (RetryConfig): The retry configuration for the embedding model.
+        truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
 
     Input types:
         The `VoyageEMInvoker` supports the following input types: text, image, and a tuple containing text and image.
@@ -85,7 +86,7 @@ class VoyageEMInvoker(BaseEMInvoker):
     ```
     '''
     client: Incomplete
-    def __init__(self, model_name: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None) -> None:
+    def __init__(self, model_name: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
         """Initializes a new instance of the VoyageEMInvoker class.
 
         Args:
@@ -98,4 +99,6 @@ class VoyageEMInvoker(BaseEMInvoker):
                 Defaults to None.
             retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
                 Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+            truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
+                Defaults to None, in which case no truncation is applied.
         """

gllm_inference/exceptions/__init__.pyi CHANGED
@@ -1,4 +1,4 @@
-from gllm_inference.exceptions.error_parser import
-from gllm_inference.exceptions.exceptions import BaseInvokerError as BaseInvokerError, InvokerRuntimeError as InvokerRuntimeError, ModelNotFoundError as ModelNotFoundError, ProviderAuthError as ProviderAuthError, ProviderInternalError as ProviderInternalError, ProviderInvalidArgsError as ProviderInvalidArgsError, ProviderOverloadedError as ProviderOverloadedError, ProviderRateLimitError as ProviderRateLimitError
+from gllm_inference.exceptions.error_parser import _get_exception_key as _get_exception_key, build_debug_info as build_debug_info, convert_http_status_to_base_invoker_error as convert_http_status_to_base_invoker_error, convert_to_base_invoker_error as convert_to_base_invoker_error
+from gllm_inference.exceptions.exceptions import APIConnectionError as APIConnectionError, APITimeoutError as APITimeoutError, BaseInvokerError as BaseInvokerError, InvokerRuntimeError as InvokerRuntimeError, ModelNotFoundError as ModelNotFoundError, ProviderAuthError as ProviderAuthError, ProviderConflictError as ProviderConflictError, ProviderInternalError as ProviderInternalError, ProviderInvalidArgsError as ProviderInvalidArgsError, ProviderOverloadedError as ProviderOverloadedError, ProviderRateLimitError as ProviderRateLimitError
 
-__all__ = ['
+__all__ = ['_get_exception_key', 'APIConnectionError', 'APITimeoutError', 'BaseInvokerError', 'InvokerRuntimeError', 'ModelNotFoundError', 'ProviderAuthError', 'ProviderConflictError', 'ProviderInternalError', 'ProviderInvalidArgsError', 'ProviderOverloadedError', 'ProviderRateLimitError', 'build_debug_info', 'convert_http_status_to_base_invoker_error', 'convert_to_base_invoker_error']
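With the expanded hierarchy (new `APIConnectionError`, `APITimeoutError`, and `ProviderConflictError`, plus the `convert_*` helpers), callers can narrow their error handling. A sketch assuming every provider failure surfaces as a `BaseInvokerError` subclass, as the `convert_to_base_invoker_error` helper suggests:

```python
from gllm_inference.exceptions import (
    APITimeoutError,
    BaseInvokerError,
    ProviderRateLimitError,
)

async def embed_safely(em_invoker, text: str):
    try:
        return await em_invoker.invoke(text)
    except (ProviderRateLimitError, APITimeoutError):
        return None  # transient: a caller could back off and retry here
    except BaseInvokerError:
        raise  # non-transient provider failures propagate
```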