gllm-inference-binary 0.5.9b1__cp311-cp311-macosx_10_9_universal2.macosx_13_0_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of gllm-inference-binary might be problematic; see the release details below.

Files changed (105)
  1. gllm_inference/__init__.pyi +0 -0
  2. gllm_inference/builder/__init__.pyi +6 -0
  3. gllm_inference/builder/build_em_invoker.pyi +137 -0
  4. gllm_inference/builder/build_lm_invoker.pyi +161 -0
  5. gllm_inference/builder/build_lm_request_processor.pyi +93 -0
  6. gllm_inference/builder/build_output_parser.pyi +29 -0
  7. gllm_inference/catalog/__init__.pyi +4 -0
  8. gllm_inference/catalog/catalog.pyi +121 -0
  9. gllm_inference/catalog/lm_request_processor_catalog.pyi +112 -0
  10. gllm_inference/catalog/prompt_builder_catalog.pyi +82 -0
  11. gllm_inference/constants.pyi +10 -0
  12. gllm_inference/em_invoker/__init__.pyi +10 -0
  13. gllm_inference/em_invoker/azure_openai_em_invoker.pyi +88 -0
  14. gllm_inference/em_invoker/bedrock_em_invoker.pyi +106 -0
  15. gllm_inference/em_invoker/em_invoker.pyi +90 -0
  16. gllm_inference/em_invoker/google_em_invoker.pyi +129 -0
  17. gllm_inference/em_invoker/langchain/__init__.pyi +3 -0
  18. gllm_inference/em_invoker/langchain/em_invoker_embeddings.pyi +84 -0
  19. gllm_inference/em_invoker/langchain_em_invoker.pyi +46 -0
  20. gllm_inference/em_invoker/openai_compatible_em_invoker.pyi +96 -0
  21. gllm_inference/em_invoker/openai_em_invoker.pyi +90 -0
  22. gllm_inference/em_invoker/schema/__init__.pyi +0 -0
  23. gllm_inference/em_invoker/schema/bedrock.pyi +22 -0
  24. gllm_inference/em_invoker/schema/google.pyi +9 -0
  25. gllm_inference/em_invoker/schema/langchain.pyi +5 -0
  26. gllm_inference/em_invoker/schema/openai.pyi +7 -0
  27. gllm_inference/em_invoker/schema/openai_compatible.pyi +7 -0
  28. gllm_inference/em_invoker/schema/twelvelabs.pyi +17 -0
  29. gllm_inference/em_invoker/schema/voyage.pyi +15 -0
  30. gllm_inference/em_invoker/twelevelabs_em_invoker.pyi +101 -0
  31. gllm_inference/em_invoker/voyage_em_invoker.pyi +104 -0
  32. gllm_inference/exceptions/__init__.pyi +4 -0
  33. gllm_inference/exceptions/error_parser.pyi +41 -0
  34. gllm_inference/exceptions/exceptions.pyi +132 -0
  35. gllm_inference/exceptions/provider_error_map.pyi +23 -0
  36. gllm_inference/lm_invoker/__init__.pyi +12 -0
  37. gllm_inference/lm_invoker/anthropic_lm_invoker.pyi +275 -0
  38. gllm_inference/lm_invoker/azure_openai_lm_invoker.pyi +252 -0
  39. gllm_inference/lm_invoker/bedrock_lm_invoker.pyi +234 -0
  40. gllm_inference/lm_invoker/datasaur_lm_invoker.pyi +166 -0
  41. gllm_inference/lm_invoker/google_lm_invoker.pyi +317 -0
  42. gllm_inference/lm_invoker/langchain_lm_invoker.pyi +260 -0
  43. gllm_inference/lm_invoker/litellm_lm_invoker.pyi +248 -0
  44. gllm_inference/lm_invoker/lm_invoker.pyi +152 -0
  45. gllm_inference/lm_invoker/openai_compatible_lm_invoker.pyi +265 -0
  46. gllm_inference/lm_invoker/openai_lm_invoker.pyi +362 -0
  47. gllm_inference/lm_invoker/schema/__init__.pyi +0 -0
  48. gllm_inference/lm_invoker/schema/anthropic.pyi +50 -0
  49. gllm_inference/lm_invoker/schema/bedrock.pyi +53 -0
  50. gllm_inference/lm_invoker/schema/datasaur.pyi +12 -0
  51. gllm_inference/lm_invoker/schema/google.pyi +24 -0
  52. gllm_inference/lm_invoker/schema/langchain.pyi +23 -0
  53. gllm_inference/lm_invoker/schema/openai.pyi +91 -0
  54. gllm_inference/lm_invoker/schema/openai_compatible.pyi +60 -0
  55. gllm_inference/lm_invoker/schema/xai.pyi +31 -0
  56. gllm_inference/lm_invoker/xai_lm_invoker.pyi +305 -0
  57. gllm_inference/model/__init__.pyi +9 -0
  58. gllm_inference/model/em/__init__.pyi +0 -0
  59. gllm_inference/model/em/google_em.pyi +16 -0
  60. gllm_inference/model/em/openai_em.pyi +15 -0
  61. gllm_inference/model/em/twelvelabs_em.pyi +13 -0
  62. gllm_inference/model/em/voyage_em.pyi +20 -0
  63. gllm_inference/model/lm/__init__.pyi +0 -0
  64. gllm_inference/model/lm/anthropic_lm.pyi +20 -0
  65. gllm_inference/model/lm/google_lm.pyi +17 -0
  66. gllm_inference/model/lm/openai_lm.pyi +27 -0
  67. gllm_inference/output_parser/__init__.pyi +3 -0
  68. gllm_inference/output_parser/json_output_parser.pyi +60 -0
  69. gllm_inference/output_parser/output_parser.pyi +27 -0
  70. gllm_inference/prompt_builder/__init__.pyi +3 -0
  71. gllm_inference/prompt_builder/prompt_builder.pyi +56 -0
  72. gllm_inference/prompt_formatter/__init__.pyi +7 -0
  73. gllm_inference/prompt_formatter/agnostic_prompt_formatter.pyi +49 -0
  74. gllm_inference/prompt_formatter/huggingface_prompt_formatter.pyi +55 -0
  75. gllm_inference/prompt_formatter/llama_prompt_formatter.pyi +59 -0
  76. gllm_inference/prompt_formatter/mistral_prompt_formatter.pyi +53 -0
  77. gllm_inference/prompt_formatter/openai_prompt_formatter.pyi +35 -0
  78. gllm_inference/prompt_formatter/prompt_formatter.pyi +30 -0
  79. gllm_inference/request_processor/__init__.pyi +4 -0
  80. gllm_inference/request_processor/lm_request_processor.pyi +101 -0
  81. gllm_inference/request_processor/uses_lm_mixin.pyi +130 -0
  82. gllm_inference/schema/__init__.pyi +14 -0
  83. gllm_inference/schema/attachment.pyi +88 -0
  84. gllm_inference/schema/code_exec_result.pyi +14 -0
  85. gllm_inference/schema/config.pyi +15 -0
  86. gllm_inference/schema/enums.pyi +29 -0
  87. gllm_inference/schema/lm_output.pyi +36 -0
  88. gllm_inference/schema/message.pyi +52 -0
  89. gllm_inference/schema/model_id.pyi +147 -0
  90. gllm_inference/schema/reasoning.pyi +15 -0
  91. gllm_inference/schema/token_usage.pyi +75 -0
  92. gllm_inference/schema/tool_call.pyi +14 -0
  93. gllm_inference/schema/tool_result.pyi +11 -0
  94. gllm_inference/schema/type_alias.pyi +11 -0
  95. gllm_inference/utils/__init__.pyi +5 -0
  96. gllm_inference/utils/io_utils.pyi +26 -0
  97. gllm_inference/utils/langchain.pyi +30 -0
  98. gllm_inference/utils/validation.pyi +12 -0
  99. gllm_inference.build/.gitignore +1 -0
  100. gllm_inference.cpython-311-darwin.so +0 -0
  101. gllm_inference.pyi +123 -0
  102. gllm_inference_binary-0.5.9b1.dist-info/METADATA +71 -0
  103. gllm_inference_binary-0.5.9b1.dist-info/RECORD +105 -0
  104. gllm_inference_binary-0.5.9b1.dist-info/WHEEL +6 -0
  105. gllm_inference_binary-0.5.9b1.dist-info/top_level.txt +1 -0
@@ -0,0 +1,96 @@
1
+ from _typeshed import Incomplete
2
+ from gllm_core.utils.retry import RetryConfig as RetryConfig
3
+ from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
4
+ from gllm_inference.em_invoker.openai_em_invoker import OpenAIEMInvoker as OpenAIEMInvoker
5
+ from gllm_inference.em_invoker.schema.openai_compatible import Key as Key
6
+ from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig
7
+ from typing import Any
8
+
9
+ class OpenAICompatibleEMInvoker(OpenAIEMInvoker):
10
+ '''An embedding model invoker to interact with endpoints compatible with OpenAI\'s embedding API contract.
11
+
12
+ Attributes:
13
+ model_id (str): The model ID of the embedding model.
14
+ model_provider (str): The provider of the embedding model.
15
+ model_name (str): The name of the embedding model.
16
+ client (AsyncOpenAI): The OpenAI client instance.
17
+ default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
18
+ retry_config (RetryConfig): The retry configuration for the embedding model.
19
+ truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
20
+
21
+
22
+ When to use:
23
+ The `OpenAICompatibleEMInvoker` is designed to interact with endpoints that are compatible with OpenAI\'s
24
+ embedding API contract. This includes but are not limited to:
25
+ 1. Text Embeddings Inference (https://github.com/huggingface/text-embeddings-inference)
26
+ 2. vLLM (https://vllm.ai/)
27
+ When using this invoker, please note that the supported features and capabilities may vary between different
28
+ endpoints and language models. Using features that are not supported by the endpoint will result in an error.
29
+
30
+ Input types:
31
+ The `OpenAICompatibleEMInvoker` only supports text inputs.
32
+
33
+ Output format:
34
+ The `OpenAICompatibleEMInvoker` can embed either:
35
+ 1. A single content.
36
+ 1. A single content is a single text.
37
+ 2. The output will be a `Vector`, representing the embedding of the content.
38
+
39
+ # Example 1: Embedding a text content.
40
+ ```python
41
+ text = "This is a text"
42
+ result = await em_invoker.invoke(text)
43
+ ```
44
+
45
+ The above examples will return a `Vector` with a size of (embedding_size,).
46
+
47
+ 2. A list of contents.
48
+ 1. A list of contents is a list of texts.
49
+ 2. The output will be a `list[Vector]`, where each element is a `Vector` representing the
50
+ embedding of each single content.
51
+
52
+ # Example: Embedding a list of contents.
53
+ ```python
54
+ text1 = "This is a text"
55
+ text2 = "This is another text"
56
+ text3 = "This is yet another text"
57
+ result = await em_invoker.invoke([text1, text2, text3])
58
+ ```
59
+
60
+ The above examples will return a `list[Vector]` with a size of (3, embedding_size).
61
+
62
+ Retry and timeout:
63
+ The `OpenAICompatibleEMInvoker` supports retry and timeout configuration.
64
+ By default, the max retries is set to 0 and the timeout is set to 30.0 seconds.
65
+ They can be customized by providing a custom `RetryConfig` object to the `retry_config` parameter.
66
+
67
+ Retry config examples:
68
+ ```python
69
+ retry_config = RetryConfig(max_retries=0, timeout=0.0) # No retry, no timeout
70
+ retry_config = RetryConfig(max_retries=0, timeout=10.0) # No retry, 10.0 seconds timeout
71
+ retry_config = RetryConfig(max_retries=5, timeout=0.0) # 5 max retries, no timeout
72
+ retry_config = RetryConfig(max_retries=5, timeout=10.0) # 5 max retries, 10.0 seconds timeout
73
+ ```
74
+
75
+ Usage example:
76
+ ```python
77
+ em_invoker = OpenAICompatibleEMInvoker(..., retry_config=retry_config)
78
+ ```
79
+ '''
80
+ client: Incomplete
81
+ def __init__(self, model_name: str, base_url: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
82
+ """Initializes a new instance of the OpenAICompatibleEMInvoker class.
83
+
84
+ Args:
85
+ model_name (str): The name of the embedding model hosted on the OpenAI compatible endpoint.
86
+ base_url (str): The base URL for the OpenAI compatible endpoint.
87
+ api_key (str | None, optional): The API key for authenticating with the OpenAI compatible endpoint.
88
+ Defaults to None, in which case the `OPENAI_API_KEY` environment variable will be used.
89
+ model_kwargs (dict[str, Any] | None, optional): Additional model parameters. Defaults to None.
90
+ default_hyperparameters (dict[str, Any] | None, optional): Default hyperparameters for invoking the model.
91
+ Defaults to None.
92
+ retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
93
+ Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
94
+ truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
95
+ Defaults to None, in which case no truncation is applied.
96
+ """
@@ -0,0 +1,90 @@
1
+ from _typeshed import Incomplete
2
+ from gllm_core.utils.retry import RetryConfig as RetryConfig
3
+ from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
4
+ from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
5
+ from gllm_inference.em_invoker.schema.openai import Key as Key
6
+ from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, Vector as Vector
7
+ from gllm_inference.schema.config import TruncationConfig as TruncationConfig
8
+ from typing import Any
9
+
10
+ SUPPORTED_ATTACHMENTS: Incomplete
11
+
12
+ class OpenAIEMInvoker(BaseEMInvoker):
13
+ '''An embedding model invoker to interact with OpenAI embedding models.
14
+
15
+ Attributes:
16
+ model_id (str): The model ID of the embedding model.
17
+ model_provider (str): The provider of the embedding model.
18
+ model_name (str): The name of the embedding model.
19
+ client (AsyncOpenAI): The client for the OpenAI API.
20
+ default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
21
+ retry_config (RetryConfig): The retry configuration for the embedding model.
22
+ truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
23
+
24
+ Input types:
25
+ The `OpenAIEMInvoker` only supports text inputs.
26
+
27
+ Output format:
28
+ The `OpenAIEMInvoker` can embed either:
29
+ 1. A single content.
30
+ 1. A single content is a single text.
31
+ 2. The output will be a `Vector`, representing the embedding of the content.
32
+
33
+ # Example 1: Embedding a text content.
34
+ ```python
35
+ text = "This is a text"
36
+ result = await em_invoker.invoke(text)
37
+ ```
38
+
39
+ The above examples will return a `Vector` with a size of (embedding_size,).
40
+
41
+ 2. A list of contents.
42
+ 1. A list of contents is a list of texts.
43
+ 2. The output will be a `list[Vector]`, where each element is a `Vector` representing the
44
+ embedding of each single content.
45
+
46
+ # Example: Embedding a list of contents.
47
+ ```python
48
+ text1 = "This is a text"
49
+ text2 = "This is another text"
50
+ text3 = "This is yet another text"
51
+ result = await em_invoker.invoke([text1, text2, text3])
52
+ ```
53
+
54
+ The above examples will return a `list[Vector]` with a size of (3, embedding_size).
55
+
56
+ Retry and timeout:
57
+ The `OpenAIEMInvoker` supports retry and timeout configuration.
58
+ By default, the max retries is set to 0 and the timeout is set to 30.0 seconds.
59
+ They can be customized by providing a custom `RetryConfig` object to the `retry_config` parameter.
60
+
61
+ Retry config examples:
62
+ ```python
63
+ retry_config = RetryConfig(max_retries=0, timeout=0.0) # No retry, no timeout
64
+ retry_config = RetryConfig(max_retries=0, timeout=10.0) # No retry, 10.0 seconds timeout
65
+ retry_config = RetryConfig(max_retries=5, timeout=0.0) # 5 max retries, no timeout
66
+ retry_config = RetryConfig(max_retries=5, timeout=10.0) # 5 max retries, 10.0 seconds timeout
67
+ ```
68
+
69
+ Usage example:
70
+ ```python
71
+ em_invoker = OpenAIEMInvoker(..., retry_config=retry_config)
72
+ ```
73
+ '''
74
+ client: Incomplete
75
+ def __init__(self, model_name: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
76
+ """Initializes a new instance of the OpenAIEMInvoker class.
77
+
78
+ Args:
79
+ model_name (str): The name of the OpenAI embedding model to be used.
80
+ api_key (str | None, optional): The API key for the OpenAI API. Defaults to None, in which
81
+ case the `OPENAI_API_KEY` environment variable will be used.
82
+ model_kwargs (dict[str, Any] | None, optional): Additional keyword arguments for the OpenAI client.
83
+ Defaults to None.
84
+ default_hyperparameters (dict[str, Any] | None, optional): Default hyperparameters for invoking the model.
85
+ Defaults to None.
86
+ retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
87
+ Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
88
+ truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
89
+ Defaults to None, in which case no truncation is applied.
90
+ """
File without changes
@@ -0,0 +1,22 @@
1
+ class Key:
2
+ """Defines valid keys in Bedrock."""
3
+ ACCEPT: str
4
+ CONTENT_TYPE: str
5
+ HTTP_STATUS_CODE: str
6
+ INPUT_TEXT: str
7
+ INPUT_TYPE: str
8
+ MODEL_ID: str
9
+ RESPONSE_METADATA: str
10
+ TEXTS: str
11
+
12
+ class InputType:
13
+ """Defines valid input types in Bedrock."""
14
+ APPLICATION_JSON: str
15
+ SEARCH_DOCUMENT: str
16
+ SEARCH_QUERY: str
17
+
18
+ class OutputType:
19
+ """Defines valid output types in Bedrock."""
20
+ BODY: str
21
+ EMBEDDING: str
22
+ EMBEDDINGS: str
@@ -0,0 +1,9 @@
1
+ class Key:
2
+ """Defines valid keys in Google."""
3
+ API_KEY: str
4
+ CREDENTIALS: str
5
+ HTTP_OPTIONS: str
6
+ LOCATION: str
7
+ PROJECT: str
8
+ TIMEOUT: str
9
+ VERTEXAI: str
@@ -0,0 +1,5 @@
1
+ class Key:
2
+ """Defines valid keys in LangChain."""
3
+ ERROR_CODE: str
4
+ MAX_RETRIES: str
5
+ TIMEOUT: str
@@ -0,0 +1,7 @@
1
+ class Key:
2
+ """Defines valid keys in OpenAI."""
3
+ API_KEY: str
4
+ BASE_URL: str
5
+ MAX_RETRIES: str
6
+ MODEL: str
7
+ TIMEOUT: str
@@ -0,0 +1,7 @@
1
+ class Key:
2
+ """Defines valid keys in OpenAI Compatible."""
3
+ API_KEY: str
4
+ BASE_URL: str
5
+ MAX_RETRIES: str
6
+ MODEL: str
7
+ TIMEOUT: str
@@ -0,0 +1,17 @@
1
+ class Key:
2
+ """Defines valid keys in TwelveLabs."""
3
+ INPUT_KEY: str
4
+ MAX_RETRIES: str
5
+ OUTPUT_KEY: str
6
+ TIMEOUT: str
7
+ VALUE: str
8
+
9
+ class InputType:
10
+ """Defines valid input types in TwelveLabs."""
11
+ FILE_SUFFIX: str
12
+ TEXT: str
13
+
14
+ class OutputType:
15
+ """Defines valid output types in TwelveLabs."""
16
+ EMBEDDING_SUFFIX: str
17
+ TEXT_EMBEDDING: str
@@ -0,0 +1,15 @@
1
+ class Key:
2
+ """Defines valid keys in Voyage."""
3
+ API_KEY: str
4
+ CONTENT: str
5
+ IMAGE_BASE64: str
6
+ MAX_RETRIES: str
7
+ MODEL: str
8
+ TEXT: str
9
+ TIMEOUT: str
10
+ TYPE: str
11
+
12
+ class InputType:
13
+ """Defines valid input types in Voyage."""
14
+ IMAGE_BASE64: str
15
+ TEXT: str
@@ -0,0 +1,101 @@
1
+ from _typeshed import Incomplete
2
+ from gllm_core.utils.retry import RetryConfig as RetryConfig
3
+ from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
4
+ from gllm_inference.em_invoker.schema.twelvelabs import InputType as InputType, Key as Key, OutputType as OutputType
5
+ from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig, Vector as Vector
6
+ from typing import Any
7
+
8
+ SUPPORTED_ATTACHMENTS: Incomplete
9
+
10
+ class TwelveLabsEMInvoker(BaseEMInvoker):
11
+ '''An embedding model invoker to interact with TwelveLabs embedding models.
12
+
13
+ Attributes:
14
+ model_id (str): The model ID of the embedding model.
15
+ model_provider (str): The provider of the embedding model.
16
+ model_name (str): The name of the embedding model.
17
+ client (Client): The client for the TwelveLabs API.
18
+ default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
19
+ retry_config (RetryConfig): The retry configuration for the embedding model.
20
+ truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
21
+
22
+ Input types:
23
+ The `TwelveLabsEMInvoker` supports the following input types: text, audio, and image.
24
+ Non-text inputs must be passed as a `Attachment` object.
25
+
26
+ Output format:
27
+ The `TwelveLabsEMInvoker` can embed either:
28
+ 1. A single content.
29
+ 1. A single content is either a text, an audio, or an image.
30
+ 2. The output will be a `Vector`, representing the embedding of the content.
31
+
32
+ # Example 1: Embedding a text content.
33
+ ```python
34
+ text = "What animal is in this image?"
35
+ result = await em_invoker.invoke(text)
36
+ ```
37
+
38
+ # Example 2: Embedding an audio content.
39
+ ```python
40
+ audio = Attachment.from_path("path/to/local/audio.mp3")
41
+ result = await em_invoker.invoke(audio)
42
+ ```
43
+
44
+ # Example 3: Embedding an image content.
45
+ ```python
46
+ image = Attachment.from_path("path/to/local/image.png")
47
+ result = await em_invoker.invoke(image)
48
+ ```
49
+
50
+ The above examples will return a `Vector` with a size of (embedding_size,).
51
+
52
+ 2. A list of contents.
53
+ 1. A list of contents is a list that consists of any of the above single contents.
54
+ 2. The output will be a `list[Vector]`, where each element is a `Vector` representing the
55
+ embedding of each single content.
56
+
57
+ # Example: Embedding a list of contents.
58
+ ```python
59
+ text = "What animal is in this image?"
60
+ audio = Attachment.from_path("path/to/local/audio.mp3")
61
+ image = Attachment.from_path("path/to/local/image.png")
62
+ result = await em_invoker.invoke([text, audio, image])
63
+ ```
64
+
65
+ The above examples will return a `list[Vector]` with a size of (3, embedding_size).
66
+
67
+ Retry and timeout:
68
+ The `TwelveLabsEMInvoker` supports retry and timeout configuration.
69
+ By default, the max retries is set to 0 and the timeout is set to 30.0 seconds.
70
+ They can be customized by providing a custom `RetryConfig` object to the `retry_config` parameter.
71
+
72
+ Retry config examples:
73
+ ```python
74
+ retry_config = RetryConfig(max_retries=0, timeout=0.0) # No retry, no timeout
75
+ retry_config = RetryConfig(max_retries=0, timeout=10.0) # No retry, 10.0 seconds timeout
76
+ retry_config = RetryConfig(max_retries=5, timeout=0.0) # 5 max retries, no timeout
77
+ retry_config = RetryConfig(max_retries=5, timeout=10.0) # 5 max retries, 10.0 seconds timeout
78
+ ```
79
+
80
+ Usage example:
81
+ ```python
82
+ em_invoker = TwelveLabsEMInvoker(..., retry_config=retry_config)
83
+ ```
84
+ '''
85
+ client: Incomplete
86
+ def __init__(self, model_name: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
87
+ """Initializes a new instance of the TwelveLabsEMInvoker class.
88
+
89
+ Args:
90
+ model_name (str): The name of the TwelveLabs embedding model to be used.
91
+ api_key (str | None, optional): The API key for the TwelveLabs API. Defaults to None, in which
92
+ case the `TWELVELABS_API_KEY` environment variable will be used.
93
+ model_kwargs (dict[str, Any] | None, optional): Additional keyword arguments for the TwelveLabs client.
94
+ Defaults to None.
95
+ default_hyperparameters (dict[str, Any] | None, optional): Default hyperparameters for invoking the model.
96
+ Defaults to None.
97
+ retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
98
+ Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
99
+ truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
100
+ Defaults to None, in which case no truncation is applied.
101
+ """
@@ -0,0 +1,104 @@
1
+ from _typeshed import Incomplete
2
+ from gllm_core.utils.retry import RetryConfig as RetryConfig
3
+ from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
4
+ from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
5
+ from gllm_inference.em_invoker.schema.voyage import InputType as InputType, Key as Key
6
+ from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig, Vector as Vector
7
+ from typing import Any
8
+
9
+ SUPPORTED_ATTACHMENTS: Incomplete
10
+ MAX_PYTHON_MINOR_VERSION: int
11
+
12
+ class VoyageEMInvoker(BaseEMInvoker):
13
+ '''An embedding model invoker to interact with Voyage embedding models.
14
+
15
+ Attributes:
16
+ model_id (str): The model ID of the embedding model.
17
+ model_provider (str): The provider of the embedding model.
18
+ model_name (str): The name of the embedding model.
19
+ client (Client): The client for the Voyage API.
20
+ default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
21
+ retry_config (RetryConfig): The retry configuration for the embedding model.
22
+ truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
23
+
24
+ Input types:
25
+ The `VoyageEMInvoker` supports the following input types: text, image, and a tuple containing text and image.
26
+ Non-text inputs must be passed as a `Attachment` object.
27
+
28
+ Output format:
29
+ The `VoyageEMInvoker` can embed either:
30
+ 1. A single content.
31
+ 1. A single content is either a text, an image, or a tuple containing a text and an image.
32
+ 2. The output will be a `Vector`, representing the embedding of the content.
33
+
34
+ # Example 1: Embedding a text content.
35
+ ```python
36
+ text = "What animal is in this image?"
37
+ result = await em_invoker.invoke(text)
38
+ ```
39
+
40
+ # Example 2: Embedding an image content.
41
+ ```python
42
+ image = Attachment.from_path("path/to/local/image.png")
43
+ result = await em_invoker.invoke(image)
44
+ ```
45
+
46
+ # Example 3: Embedding a tuple containing a text and an image.
47
+ ```python
48
+ text = "What animal is in this image?"
49
+ image = Attachment.from_path("path/to/local/image.png")
50
+ result = await em_invoker.invoke((text, image))
51
+ ```
52
+
53
+ The above examples will return a `Vector` with a size of (embedding_size,).
54
+
55
+ 2. A list of contents.
56
+ 1. A list of contents is a list that consists of any of the above single contents.
57
+ 2. The output will be a `list[Vector]`, where each element is a `Vector` representing the
58
+ embedding of each single content.
59
+
60
+ # Example: Embedding a list of contents.
61
+ ```python
62
+ text = "What animal is in this image?"
63
+ image = Attachment.from_path("path/to/local/image.png")
64
+ mix_content = (text, image)
65
+ result = await em_invoker.invoke([text, image, mix_content])
66
+ ```
67
+
68
+ The above examples will return a `list[Vector]` with a size of (3, embedding_size).
69
+
70
+ Retry and timeout:
71
+ The `VoyageEMInvoker` supports retry and timeout configuration.
72
+ By default, the max retries is set to 0 and the timeout is set to 30.0 seconds.
73
+ They can be customized by providing a custom `RetryConfig` object to the `retry_config` parameter.
74
+
75
+ Retry config examples:
76
+ ```python
77
+ retry_config = RetryConfig(max_retries=0, timeout=0.0) # No retry, no timeout
78
+ retry_config = RetryConfig(max_retries=0, timeout=10.0) # No retry, 10.0 seconds timeout
79
+ retry_config = RetryConfig(max_retries=5, timeout=0.0) # 5 max retries, no timeout
80
+ retry_config = RetryConfig(max_retries=5, timeout=10.0) # 5 max retries, 10.0 seconds timeout
81
+ ```
82
+
83
+ Usage example:
84
+ ```python
85
+ em_invoker = VoyageEMInvoker(..., retry_config=retry_config)
86
+ ```
87
+ '''
88
+ client: Incomplete
89
+ def __init__(self, model_name: str, api_key: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
90
+ """Initializes a new instance of the VoyageEMInvoker class.
91
+
92
+ Args:
93
+ model_name (str): The name of the Voyage embedding model to be used.
94
+ api_key (str | None, optional): The API key for the Voyage API. Defaults to None, in which
95
+ case the `VOYAGE_API_KEY` environment variable will be used.
96
+ model_kwargs (dict[str, Any] | None, optional): Additional keyword arguments for the Voyage client.
97
+ Defaults to None.
98
+ default_hyperparameters (dict[str, Any] | None, optional): Default hyperparameters for invoking the model.
99
+ Defaults to None.
100
+ retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
101
+ Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
102
+ truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
103
+ Defaults to None, in which case no truncation is applied.
104
+ """
@@ -0,0 +1,4 @@
1
+ from gllm_inference.exceptions.error_parser import _get_exception_key as _get_exception_key, build_debug_info as build_debug_info, convert_http_status_to_base_invoker_error as convert_http_status_to_base_invoker_error, convert_to_base_invoker_error as convert_to_base_invoker_error
2
+ from gllm_inference.exceptions.exceptions import APIConnectionError as APIConnectionError, APITimeoutError as APITimeoutError, BaseInvokerError as BaseInvokerError, InvokerRuntimeError as InvokerRuntimeError, ModelNotFoundError as ModelNotFoundError, ProviderAuthError as ProviderAuthError, ProviderConflictError as ProviderConflictError, ProviderInternalError as ProviderInternalError, ProviderInvalidArgsError as ProviderInvalidArgsError, ProviderOverloadedError as ProviderOverloadedError, ProviderRateLimitError as ProviderRateLimitError
3
+
4
+ __all__ = ['_get_exception_key', 'APIConnectionError', 'APITimeoutError', 'BaseInvokerError', 'InvokerRuntimeError', 'ModelNotFoundError', 'ProviderAuthError', 'ProviderConflictError', 'ProviderInternalError', 'ProviderInvalidArgsError', 'ProviderOverloadedError', 'ProviderRateLimitError', 'build_debug_info', 'convert_http_status_to_base_invoker_error', 'convert_to_base_invoker_error']
@@ -0,0 +1,41 @@
1
+ from gllm_inference.exceptions.exceptions import BaseInvokerError as BaseInvokerError, InvokerRuntimeError as InvokerRuntimeError
2
+ from gllm_inference.exceptions.provider_error_map import ALL_PROVIDER_ERROR_MAPPINGS as ALL_PROVIDER_ERROR_MAPPINGS, HTTP_STATUS_TO_EXCEPTION_MAP as HTTP_STATUS_TO_EXCEPTION_MAP
3
+ from typing import Any
4
+
5
+ def build_debug_info(error: Any, class_name: str) -> dict[str, Any]:
6
+ """Build debug information for an error.
7
+
8
+ Args:
9
+ error (Any): The error to extract debug information from.
10
+ class_name (str): The name of the class that raised the error.
11
+
12
+ Returns:
13
+ dict[str, Any]: A dictionary containing debug information about the error.
14
+ """
15
+ def convert_http_status_to_base_invoker_error(error: Exception, invoker: BaseEMInvoker | BaseLMInvoker, status_code_extractor: callable = None, provider_error_mapping: dict[str, type[BaseInvokerError]] = ...) -> BaseInvokerError:
16
+ """Extract provider error with HTTP status code fallback pattern.
17
+
18
+ This function implements the common pattern used by Bedrock and Google invokers
19
+ where they first try to extract HTTP status codes, then fall back to provider-specific
20
+ error mappings based on exception keys.
21
+
22
+ Args:
23
+ error (Exception): The error to convert.
24
+ invoker (BaseEMInvoker | BaseLMInvoker): The invoker instance that raised the error.
25
+ status_code_extractor (callable): Function to extract status code from error.
26
+ provider_error_mapping (dict): Provider-specific error mapping dictionary.
27
+
28
+ Returns:
29
+ BaseInvokerError: The converted error.
30
+ """
31
+ def convert_to_base_invoker_error(error: Exception, invoker: BaseEMInvoker | BaseLMInvoker) -> BaseInvokerError:
32
+ """Convert provider error into BaseInvokerError.
33
+
34
+ Args:
35
+ error (Exception): The error to convert.
36
+ invoker (BaseEMInvoker | BaseLMInvoker): The invoker instance that raised the error.
37
+
38
+ Returns:
39
+ BaseInvokerError: The converted error.
40
+
41
+ """