PyPI - gllm-inference-binary - Versions diffs - 0.5.41__cp311-cp311-macosx_13_0_x86_64.whl → 0.5.44__cp311-cp311-macosx_13_0_x86_64.whl - Mend

gllm-inference-binary 0.5.41__cp311-cp311-macosx_13_0_x86_64.whl → 0.5.44__cp311-cp311-macosx_13_0_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of gllm-inference-binary might be problematic. Click here for more details.

Files changed (20) hide show

gllm_inference/builder/build_em_invoker.pyi +13 -2
gllm_inference/constants.pyi +4 -2
gllm_inference/em_invoker/__init__.pyi +3 -1
gllm_inference/em_invoker/cohere_em_invoker.pyi +128 -0
gllm_inference/em_invoker/jina_em_invoker.pyi +103 -0
gllm_inference/em_invoker/schema/cohere.pyi +20 -0
gllm_inference/em_invoker/schema/jina.pyi +28 -0
gllm_inference/exceptions/provider_error_map.pyi +1 -0
gllm_inference/lm_invoker/lm_invoker.pyi +1 -1
gllm_inference/schema/__init__.pyi +2 -2
gllm_inference/schema/activity.pyi +13 -11
gllm_inference/schema/enums.pyi +10 -0
gllm_inference/schema/events.pyi +57 -42
gllm_inference/schema/model_id.pyi +15 -0
gllm_inference.cpython-311-darwin.so +0 -0
gllm_inference.pyi +10 -6
{gllm_inference_binary-0.5.41.dist-info → gllm_inference_binary-0.5.44.dist-info}/METADATA +4 -2
{gllm_inference_binary-0.5.41.dist-info → gllm_inference_binary-0.5.44.dist-info}/RECORD +20 -16
{gllm_inference_binary-0.5.41.dist-info → gllm_inference_binary-0.5.44.dist-info}/WHEEL +0 -0
{gllm_inference_binary-0.5.41.dist-info → gllm_inference_binary-0.5.44.dist-info}/top_level.txt +0 -0

gllm_inference/builder/build_em_invoker.pyi CHANGED Viewed

@@ -1,7 +1,7 @@
 from _typeshed import Incomplete
-from gllm_inference.em_invoker import AzureOpenAIEMInvoker as AzureOpenAIEMInvoker, BedrockEMInvoker as BedrockEMInvoker, GoogleEMInvoker as GoogleEMInvoker, LangChainEMInvoker as LangChainEMInvoker, OpenAICompatibleEMInvoker as OpenAICompatibleEMInvoker, OpenAIEMInvoker as OpenAIEMInvoker, TwelveLabsEMInvoker as TwelveLabsEMInvoker, VoyageEMInvoker as VoyageEMInvoker
+from gllm_inference.em_invoker import AzureOpenAIEMInvoker as AzureOpenAIEMInvoker, BedrockEMInvoker as BedrockEMInvoker, CohereEMInvoker as CohereEMInvoker, GoogleEMInvoker as GoogleEMInvoker, JinaEMInvoker as JinaEMInvoker, LangChainEMInvoker as LangChainEMInvoker, OpenAICompatibleEMInvoker as OpenAICompatibleEMInvoker, OpenAIEMInvoker as OpenAIEMInvoker, TwelveLabsEMInvoker as TwelveLabsEMInvoker, VoyageEMInvoker as VoyageEMInvoker
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
-from gllm_inference.schema.model_id import ModelId as ModelId, ModelProvider as ModelProvider
+from gllm_inference.schema.model_id import ModelId as ModelId, ModelProvider as ModelProvider, OPTIONAL_PATH_PROVIDERS as OPTIONAL_PATH_PROVIDERS
 from typing import Any
 PROVIDER_TO_EM_INVOKER_MAP: dict[str, type[BaseEMInvoker]]
@@ -71,6 +71,16 @@ def build_em_invoker(model_id: str | ModelId, credentials: str | dict[str, Any]
         ```
         Providing credentials through environment variable is not supported for Google Vertex AI.
+        # Using Jina
+        ```python
+        em_invoker = build_em_invoker(
+            model_id="jina/jina-embeddings-v2-large",
+            credentials="jina-api-key"
+        )
+        ```
+        The credentials can also be provided through the `JINA_API_KEY` environment variable. For the list of supported
+        models, please refer to the following page: https://jina.ai/models
         # Using OpenAI
         ```python
         em_invoker = build_em_invoker(
@@ -128,6 +138,7 @@ def build_em_invoker(model_id: str | ModelId, credentials: str | dict[str, Any]
         variables credentials, please refer to the following page:
         https://python.langchain.com/docs/integrations/text_embedding/
     Security warning:
         Please provide the EM invoker credentials ONLY to the `credentials` parameter. Do not put any kind of
         credentials in the `config` parameter as the content of the `config` parameter will be logged.

gllm_inference/constants.pyi CHANGED Viewed

@@ -2,10 +2,12 @@ from _typeshed import Incomplete
 AZURE_OPENAI_URL_SUFFIX: str
 DOCUMENT_MIME_TYPES: Incomplete
+EMBEDDING_ENDPOINT: str
 GOOGLE_SCOPES: Incomplete
 GRPC_ENABLE_RETRIES_KEY: str
-INVOKER_PROPAGATED_MAX_RETRIES: int
-INVOKER_DEFAULT_TIMEOUT: float
 HEX_REPR_LENGTH: int
+INVOKER_DEFAULT_TIMEOUT: float
+INVOKER_PROPAGATED_MAX_RETRIES: int
+JINA_DEFAULT_URL: str
 OPENAI_DEFAULT_URL: str
 SECONDS_TO_MILLISECONDS: int

gllm_inference/em_invoker/__init__.pyi CHANGED Viewed

@@ -1,10 +1,12 @@
 from gllm_inference.em_invoker.azure_openai_em_invoker import AzureOpenAIEMInvoker as AzureOpenAIEMInvoker
 from gllm_inference.em_invoker.bedrock_em_invoker import BedrockEMInvoker as BedrockEMInvoker
+from gllm_inference.em_invoker.cohere_em_invoker import CohereEMInvoker as CohereEMInvoker
 from gllm_inference.em_invoker.google_em_invoker import GoogleEMInvoker as GoogleEMInvoker
+from gllm_inference.em_invoker.jina_em_invoker import JinaEMInvoker as JinaEMInvoker
 from gllm_inference.em_invoker.langchain_em_invoker import LangChainEMInvoker as LangChainEMInvoker
 from gllm_inference.em_invoker.openai_compatible_em_invoker import OpenAICompatibleEMInvoker as OpenAICompatibleEMInvoker
 from gllm_inference.em_invoker.openai_em_invoker import OpenAIEMInvoker as OpenAIEMInvoker
 from gllm_inference.em_invoker.twelevelabs_em_invoker import TwelveLabsEMInvoker as TwelveLabsEMInvoker
 from gllm_inference.em_invoker.voyage_em_invoker import VoyageEMInvoker as VoyageEMInvoker
-__all__ = ['AzureOpenAIEMInvoker', 'BedrockEMInvoker', 'GoogleEMInvoker', 'LangChainEMInvoker', 'OpenAIEMInvoker', 'OpenAICompatibleEMInvoker', 'TwelveLabsEMInvoker', 'VoyageEMInvoker']
+__all__ = ['AzureOpenAIEMInvoker', 'BedrockEMInvoker', 'CohereEMInvoker', 'GoogleEMInvoker', 'JinaEMInvoker', 'LangChainEMInvoker', 'OpenAIEMInvoker', 'OpenAICompatibleEMInvoker', 'TwelveLabsEMInvoker', 'VoyageEMInvoker']

gllm_inference/em_invoker/cohere_em_invoker.pyi ADDED Viewed

@@ -0,0 +1,128 @@
+from _typeshed import Incomplete
+from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
+from gllm_inference.em_invoker.schema.cohere import CohereInputType as CohereInputType, Key as Key
+from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig, Vector as Vector
+from gllm_inference.utils import validate_string_enum as validate_string_enum
+from typing import Any
+SUPPORTED_ATTACHMENTS: Incomplete
+MULTIMODAL_MODEL_VERSION: Incomplete
+class CohereEMInvoker(BaseEMInvoker):
+    '''An embedding model invoker to interact with Cohere embedding models.
+    Attributes:
+        model_id (str): The model ID of the embedding model.
+        model_provider (str): The provider of the embedding model (Cohere).
+        model_name (str): The name of the Cohere embedding model.
+        client (AsyncClient): The asynchronous client for the Cohere API.
+        default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
+        retry_config (RetryConfig): The retry configuration for the embedding model.
+        truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
+        input_type (CohereInputType): The input type for the embedding model. Supported values include:
+            1. `CohereInputType.SEARCH_DOCUMENT`,
+            2. `CohereInputType.SEARCH_QUERY`,
+            3. `CohereInputType.CLASSIFICATION`,
+            4. `CohereInputType.CLUSTERING`,
+            5. `CohereInputType.IMAGE`.
+    Initialization:
+        You can initialize the `CohereEMInvoker` as follows:
+        ```python
+        em_invoker = CohereEMInvoker(
+            model_name="embed-english-v4.0",
+            input_type="search_document"
+        )
+        ```
+        Note: The `input_type` parameter can be one of the following:
+        1. "search_document"
+        2. "search_query"
+        3. "classification"
+        4. "clustering"
+        5. "image"
+        This parameter is optional and defaults to "search_document". For more information about
+        input_type, please refer to https://docs.cohere.com/docs/embeddings#the-input_type-parameter.
+    Input types:
+        The `CohereEMInvoker` supports the following input types: text and image.
+        Non-text inputs must be passed as an `Attachment` object.
+    Output format:
+        The `CohereEMInvoker` can embed either:
+        1. A single content.
+           1. A single content is either a text or an image.
+           2. The output will be a `Vector`, representing the embedding of the content.
+           # Example 1: Embedding a text content.
+           ```python
+           text = "What animal is in this image?"
+           result = await em_invoker.invoke(text)
+           ```
+           # Example 2: Embedding an image content.
+           ```python
+           image = Attachment.from_path("path/to/local/image.png")
+           result = await em_invoker.invoke(image)
+           ```
+           The above examples will return a `Vector` with a size of (embedding_size,).
+        2. A list of contents.
+           1. A list of contents is a list that consists of any of the above single contents.
+           2. The output will be a `list[Vector]`, where each element is a `Vector` representing the
+              embedding of each single content.
+           # Example: Embedding a list of contents.
+           ```python
+           text = "What animal is in this image?"
+           image = Attachment.from_path("path/to/local/image.png")
+           result = await em_invoker.invoke([text, image])
+           ```
+           The above example will return a `list[Vector]` with a size of (2, embedding_size).
+    Retry and timeout:
+        The `CohereEMInvoker` supports retry and timeout configuration.
+        By default, the max retries is set to 0 and the timeout is set to 30.0 seconds.
+        They can be customized by providing a custom `RetryConfig` object to the `retry_config` parameter.
+        Retry config examples:
+        ```python
+        retry_config = RetryConfig(max_retries=0, timeout=None)  # No retry, no timeout
+        retry_config = RetryConfig(max_retries=0, timeout=10.0)  # No retry, 10.0 seconds timeout
+        retry_config = RetryConfig(max_retries=5, timeout=None)  # 5 max retries, no timeout
+        retry_config = RetryConfig(max_retries=5, timeout=10.0)  # 5 max retries, 10.0 seconds timeout
+        ```
+        Usage example:
+        ```python
+        em_invoker = CohereEMInvoker(..., retry_config=retry_config)
+        ```
+    '''
+    input_type: Incomplete
+    client: Incomplete
+    def __init__(self, model_name: str, api_key: str | None = None, base_url: str | None = None, model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None, input_type: CohereInputType = ...) -> None:
+        '''Initializes a new instance of the CohereEMInvoker class.
+        Args:
+            model_name (str): The name of the Cohere embedding model to be used.
+            api_key (str | None, optional): The API key for authenticating with Cohere. Defaults to None, in which
+                case the `COHERE_API_KEY` environment variable will be used.
+            base_url (str | None, optional): The base URL for a custom Cohere-compatible endpoint.
+                Defaults to None, in which case Cohere\'s default URL will be used.
+            model_kwargs (dict[str, Any] | None, optional): Additional keyword arguments for the Cohere client.
+                Defaults to None.
+            default_hyperparameters (dict[str, Any] | None, optional): Default hyperparameters for invoking the model.
+                Defaults to None.
+            retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
+                Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+            truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
+                Defaults to None, in which case no truncation is applied.
+            input_type (CohereInputType, optional): The input type for the embedding model.
+                Defaults to `CohereInputType.SEARCH_DOCUMENT`. Valid values are: "search_document", "search_query",
+                "classification", "clustering", and "image".
+        '''

gllm_inference/em_invoker/jina_em_invoker.pyi ADDED Viewed

@@ -0,0 +1,103 @@
+from _typeshed import Incomplete
+from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_inference.constants import EMBEDDING_ENDPOINT as EMBEDDING_ENDPOINT, JINA_DEFAULT_URL as JINA_DEFAULT_URL
+from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
+from gllm_inference.em_invoker.schema.jina import InputType as InputType, Key as Key
+from gllm_inference.exceptions import BaseInvokerError as BaseInvokerError, ProviderInternalError as ProviderInternalError
+from gllm_inference.exceptions.error_parser import convert_http_status_to_base_invoker_error as convert_http_status_to_base_invoker_error
+from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, ModelProvider as ModelProvider, TruncationConfig as TruncationConfig, Vector as Vector
+from typing import Any
+SUPPORTED_ATTACHMENTS: Incomplete
+MULTIMODAL_MODELS: Incomplete
+class JinaEMInvoker(BaseEMInvoker):
+    '''An embedding model invoker to interact with Jina AI embedding models.
+    Attributes:
+        model_id (str): The model ID of the embedding model.
+        model_provider (str): The provider of the embedding model.
+        model_name (str): The name of the embedding model.
+        client (AsyncClient): The client for the Jina AI API.
+        default_hyperparameters (dict[str, Any]): Default hyperparameters for invoking the embedding model.
+        retry_config (RetryConfig): The retry configuration for the embedding model.
+        truncation_config (TruncationConfig | None): The truncation configuration for the embedding model.
+    Input types:
+        The `JinaEMInvoker` supports the following input types: text and image.
+        Non-text inputs must be passed as an `Attachment` object.
+    Output format:
+        The `JinaEMInvoker` can embed either:
+        1. A single content.
+           1. A single content is either a text or an image.
+           2. The output will be a `Vector`, representing the embedding of the content.
+           # Example 1: Embedding a text content.
+           ```python
+           text = "What animal is in this image?"
+           result = await em_invoker.invoke(text)
+           ```
+           # Example 2: Embedding an image content.
+           ```python
+           image = Attachment.from_path("path/to/local/image.png")
+           result = await em_invoker.invoke(image)
+           ```
+           The above examples will return a `Vector` with a size of (embedding_size,).
+        2. A list of contents.
+           1. A list of contents is a list that consists of any of the above single contents.
+           2. The output will be a `list[Vector]`, where each element is a `Vector` representing the
+              embedding of each single content.
+           # Example: Embedding a list of contents.
+           ```python
+           text = "What animal is in this image?"
+           image = Attachment.from_path("path/to/local/image.png")
+           result = await em_invoker.invoke([text, image])
+           ```
+           The above example will return a `list[Vector]` with a size of (2, embedding_size).
+    Retry and timeout:
+        The `JinaEMInvoker` supports retry and timeout configuration.
+        By default, the max retries is set to 0 and the timeout is set to 30.0 seconds.
+        They can be customized by providing a custom `RetryConfig` object to the `retry_config` parameter.
+        Retry config examples:
+        ```python
+        retry_config = RetryConfig(max_retries=0, timeout=None)  # No retry, no timeout
+        retry_config = RetryConfig(max_retries=0, timeout=10.0)  # No retry, 10.0 seconds timeout
+        retry_config = RetryConfig(max_retries=5, timeout=None)  # 5 max retries, no timeout
+        retry_config = RetryConfig(max_retries=5, timeout=10.0)  # 5 max retries, 10.0 seconds timeout
+        ```
+        Usage example:
+        ```python
+        em_invoker = JinaEMInvoker(..., retry_config=retry_config)
+        ```
+    '''
+    client: Incomplete
+    model_kwargs: Incomplete
+    def __init__(self, model_name: str, api_key: str | None = None, base_url: str = ..., model_kwargs: dict[str, Any] | None = None, default_hyperparameters: dict[str, Any] | None = None, retry_config: RetryConfig | None = None, truncation_config: TruncationConfig | None = None) -> None:
+        '''Initializes a new instance of the JinaEMInvoker class.
+        Args:
+            model_name (str): The name of the Jina embedding model to be used.
+            api_key (str | None, optional): The API key for authenticating with Jina AI.
+                Defaults to None, in which case the `JINA_API_KEY` environment variable will be used.
+            base_url (str, optional): The base URL for the Jina AI API. Defaults to "https://api.jina.ai/v1".
+            model_kwargs (dict[str, Any] | None, optional): Additional keyword arguments for the HTTP client.
+                Defaults to None.
+            default_hyperparameters (dict[str, Any] | None, optional): Default hyperparameters for invoking the model.
+                Defaults to None.
+            retry_config (RetryConfig | None, optional): The retry configuration for the embedding model.
+                Defaults to None, in which case a default config with no retry and 30.0 seconds timeout will be used.
+            truncation_config (TruncationConfig | None, optional): Configuration for text truncation behavior.
+                Defaults to None, in which case no truncation is applied.
+        Raises:
+            ValueError: If neither `api_key` nor `JINA_API_KEY` environment variable is provided.
+        '''

gllm_inference/em_invoker/schema/cohere.pyi ADDED Viewed

@@ -0,0 +1,20 @@
+from enum import StrEnum
+class Key(StrEnum):
+    """Defines valid keys in Cohere."""
+    BASE_URL = 'base_url'
+    IMAGE_URL = 'image_url'
+    INPUT_TYPE = 'input_type'
+    MAX_RETRIES = 'max_retries'
+    MODEL = 'model'
+    TIMEOUT = 'timeout'
+    TYPE = 'type'
+    URL = 'url'
+class CohereInputType(StrEnum):
+    """Defines valid embedding input types for Cohere embedding API."""
+    CLASSIFICATION = 'classification'
+    CLUSTERING = 'clustering'
+    IMAGE = 'image'
+    SEARCH_DOCUMENT = 'search_document'
+    SEARCH_QUERY = 'search_query'

gllm_inference/em_invoker/schema/jina.pyi ADDED Viewed

@@ -0,0 +1,28 @@
+from enum import StrEnum
+class InputType(StrEnum):
+    """Defines the supported input types for the Jina AI embedding API."""
+    IMAGE_URL = 'image_url'
+    TEXT = 'text'
+class Key(StrEnum):
+    """Defines key constants used in the Jina AI API payloads."""
+    DATA = 'data'
+    EMBEDDING = 'embedding'
+    ERROR = 'error'
+    IMAGE_URL = 'image_url'
+    INPUT = 'input'
+    JSON = 'json'
+    MESSAGE = 'message'
+    MODEL = 'model'
+    RESPONSE = 'response'
+    STATUS = 'status'
+    TASK = 'task'
+    TEXT = 'text'
+    TYPE = 'type'
+    URL = 'url'
+class OutputType(StrEnum):
+    """Defines the expected output types returned by the Jina AI embedding API."""
+    DATA = 'data'
+    EMBEDDING = 'embedding'

gllm_inference/exceptions/provider_error_map.pyi CHANGED Viewed

@@ -13,6 +13,7 @@ class ExtendedHTTPStatus(IntEnum):
 HTTP_STATUS_TO_EXCEPTION_MAP: dict[int, type[BaseInvokerError]]
 ANTHROPIC_ERROR_MAPPING: Incomplete
 BEDROCK_ERROR_MAPPING: Incomplete
+COHERE_ERROR_MAPPING: Incomplete
 GOOGLE_ERROR_MAPPING: Incomplete
 LANGCHAIN_ERROR_CODE_MAPPING: Incomplete
 LITELLM_ERROR_MAPPING: Incomplete

gllm_inference/lm_invoker/lm_invoker.pyi CHANGED Viewed

@@ -7,7 +7,7 @@ from gllm_core.utils import RetryConfig
 from gllm_inference.constants import DOCUMENT_MIME_TYPES as DOCUMENT_MIME_TYPES, INVOKER_DEFAULT_TIMEOUT as INVOKER_DEFAULT_TIMEOUT
 from gllm_inference.exceptions import BaseInvokerError as BaseInvokerError, convert_to_base_invoker_error as convert_to_base_invoker_error
 from gllm_inference.lm_invoker.batch import BatchOperations as BatchOperations
-from gllm_inference.schema import Activity as Activity, Attachment as Attachment, AttachmentType as AttachmentType, BatchStatus as BatchStatus, LMInput as LMInput, LMOutput as LMOutput, Message as Message, MessageContent as MessageContent, MessageRole as MessageRole, ModelId as ModelId, Reasoning as Reasoning, ResponseSchema as ResponseSchema, ToolCall as ToolCall, ToolResult as ToolResult
+from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, BatchStatus as BatchStatus, LMEventType as LMEventType, LMInput as LMInput, LMOutput as LMOutput, Message as Message, MessageContent as MessageContent, MessageRole as MessageRole, ModelId as ModelId, Reasoning as Reasoning, ResponseSchema as ResponseSchema, ToolCall as ToolCall, ToolResult as ToolResult
 from langchain_core.tools import Tool as LangChainTool
 from typing import Any

gllm_inference/schema/__init__.pyi CHANGED Viewed

@@ -2,7 +2,7 @@ from gllm_inference.schema.activity import Activity as Activity, MCPCallActivity
 from gllm_inference.schema.attachment import Attachment as Attachment
 from gllm_inference.schema.code_exec_result import CodeExecResult as CodeExecResult
 from gllm_inference.schema.config import TruncationConfig as TruncationConfig
-from gllm_inference.schema.enums import AttachmentType as AttachmentType, BatchStatus as BatchStatus, EmitDataType as EmitDataType, MessageRole as MessageRole, TruncateSide as TruncateSide
+from gllm_inference.schema.enums import AttachmentType as AttachmentType, BatchStatus as BatchStatus, EmitDataType as EmitDataType, LMEventType as LMEventType, MessageRole as MessageRole, TruncateSide as TruncateSide
 from gllm_inference.schema.events import ActivityEvent as ActivityEvent, CodeEvent as CodeEvent, ThinkingEvent as ThinkingEvent
 from gllm_inference.schema.lm_input import LMInput as LMInput
 from gllm_inference.schema.lm_output import LMOutput as LMOutput
@@ -15,4 +15,4 @@ from gllm_inference.schema.tool_call import ToolCall as ToolCall
 from gllm_inference.schema.tool_result import ToolResult as ToolResult
 from gllm_inference.schema.type_alias import EMContent as EMContent, MessageContent as MessageContent, ResponseSchema as ResponseSchema, Vector as Vector
-__all__ = ['Activity', 'ActivityEvent', 'Attachment', 'AttachmentType', 'BatchStatus', 'CodeEvent', 'CodeExecResult', 'EMContent', 'EmitDataType', 'InputTokenDetails', 'LMInput', 'LMOutput', 'MCPCall', 'MCPCallActivity', 'MCPListToolsActivity', 'MCPServer', 'Message', 'MessageContent', 'MessageRole', 'ModelId', 'ModelProvider', 'OutputTokenDetails', 'Reasoning', 'ThinkingEvent', 'ResponseSchema', 'TokenUsage', 'ToolCall', 'ToolResult', 'TruncateSide', 'TruncationConfig', 'Vector', 'WebSearchActivity']
+__all__ = ['Activity', 'ActivityEvent', 'Attachment', 'AttachmentType', 'BatchStatus', 'CodeEvent', 'CodeExecResult', 'EMContent', 'EmitDataType', 'LMEventType', 'InputTokenDetails', 'LMInput', 'LMOutput', 'MCPCall', 'MCPCallActivity', 'MCPListToolsActivity', 'MCPServer', 'Message', 'MessageContent', 'MessageRole', 'ModelId', 'ModelProvider', 'OutputTokenDetails', 'Reasoning', 'ThinkingEvent', 'ResponseSchema', 'TokenUsage', 'ToolCall', 'ToolResult', 'TruncateSide', 'TruncationConfig', 'Vector', 'WebSearchActivity']

gllm_inference/schema/activity.pyi CHANGED Viewed

@@ -4,12 +4,13 @@ from pydantic import BaseModel
 from typing import Literal
 WEB_SEARCH_VISIBLE_FIELDS: Incomplete
+WebSearchActivityTypes: Incomplete
 class Activity(BaseModel):
     """Base schema for any activity.
     Attributes:
-        type (str): The type of activity being performed.
+        type (str): The type of activity being performed. Defaults to an empty string.
     """
     type: str
@@ -17,9 +18,10 @@ class MCPListToolsActivity(Activity):
     """Schema for listing tools in MCP.
     Attributes:
-        server_name (str): The name of the MCP server.
-        tools (list[dict[str, str]] | None): The tools in the MCP server.
-        type (str): The type of activity being performed.
+        type (Literal[ActivityType.MCP_LIST_TOOLS]): The type of activity being performed.
+            Defaults to ActivityType.MCP_LIST_TOOLS.
+        server_name (str): The name of the MCP server. Defaults to an empty string.
+        tools (list[dict[str, str]] | None): The tools in the MCP server. Defaults to None.
     """
     type: Literal[ActivityType.MCP_LIST_TOOLS]
     server_name: str
@@ -29,10 +31,10 @@ class MCPCallActivity(Activity):
     """Schema for MCP tool call.
     Attributes:
+        type (Literal[ActivityType.MCP_CALL]): The type of activity being performed. Defaults to ActivityType.MCP_CALL.
         server_name (str): The name of the MCP server.
         tool_name (str): The name of the tool.
         args (dict[str, str]): The arguments of the tool.
-        type (str): The type of activity being performed.
     """
     type: Literal[ActivityType.MCP_CALL]
     server_name: str
@@ -43,16 +45,16 @@ class WebSearchActivity(Activity):
     """Schema for web search tool call.
     Attributes:
-        type (str): The type of activity being performed.
-        pattern (str): The pattern of the web search.
-        url (str): The URL of the page.
-        query (str): The query of the web search.
+        type (WebSearchActivityTypes): The type of activity being performed. Defaults to ActivityType.SEARCH.
+        query (str | None): The query of the web search. Defaults to None.
+        url (str | None): The URL of the page. Defaults to None.
+        pattern (str | None): The pattern of the web search. Defaults to None.
         sources (list[dict[str, str]] | None): The sources of the web search.
     """
-    type: Literal[ActivityType.FIND_IN_PAGE, ActivityType.OPEN_PAGE, ActivityType.SEARCH]
+    type: WebSearchActivityTypes
+    query: str | None
     url: str | None
     pattern: str | None
-    query: str | None
     sources: list[dict[str, str]] | None
     def model_dump(self, *args, **kwargs) -> dict[str, str]:
         """Serialize the activity for display.

gllm_inference/schema/enums.pyi CHANGED Viewed

@@ -14,6 +14,16 @@ class BatchStatus(StrEnum):
     FINISHED = 'finished'
     UNKNOWN = 'unknown'
+class LMEventType(StrEnum):
+    """Defines event types to be emitted by the LM invoker."""
+    ACTIVITY = 'activity'
+    CODE_START = 'code_start'
+    CODE = 'code'
+    CODE_END = 'code_end'
+    THINKING_START = 'thinking_start'
+    THINKING = 'thinking'
+    THINKING_END = 'thinking_end'
 class EmitDataType(StrEnum):
     """Defines valid data types for emitting events."""
     ACTIVITY = 'activity'

gllm_inference/schema/events.pyi CHANGED Viewed

@@ -1,108 +1,123 @@
-from gllm_core.constants import EventLevel
+from _typeshed import Incomplete
 from gllm_core.schema import Event
 from gllm_inference.schema.activity import Activity as Activity
-from gllm_inference.schema.enums import EmitDataType as EmitDataType
-from typing import Literal
+from gllm_inference.schema.enums import LMEventType as LMEventType
+from typing import Any, Literal
+CodeEventType: Incomplete
+ThinkingEventType: Incomplete
 class ActivityEvent(Event):
-    """Event schema for model-triggered activities (e.g. web search, MCP).
+    """Event schema for model-triggered activities (e.g. web search, MCP call, etc.).
     Attributes:
-        id (str): The unique identifier for the activity event. Defaults to an empty string.
-        type (Literal): The type of event, always 'activity'.
-        value (Activity): The activity data containing message and type.
-        level (EventLevel): The severity level of the event. Defined through the EventLevel constants.
+        id (str): The ID of the activity event. Defaults to None.
+        value (dict[str, Any]): The value of the activity event.
+        level (EventLevel): The severity level of the activity event. Defaults to EventLevel.INFO.
+        type (Literal[LMEventType.ACTIVITY]): The type of the activity event. Defaults to LMEventType.ACTIVITY.
+        timestamp (datetime): The timestamp of the activity event. Defaults to the current timestamp.
+        metadata (dict[str, Any]): The metadata of the activity event. Defaults to an empty dictionary.
     """
-    id: str
-    type: Literal[EmitDataType.ACTIVITY]
-    value: Activity
-    level: EventLevel
+    value: dict[str, Any]
+    type: Literal[LMEventType.ACTIVITY]
+    @classmethod
+    def from_activity(cls, id_: str | None = None, activity: Activity | None = None) -> ActivityEvent:
+        """Create an activity event from an Activity object.
+        Args:
+            id_ (str | None, optional): The ID of the activity event. Defaults to None.
+            activity (Activity | None, optional): The activity object to create the event from.
+                Defaults to None, in which case the value will be an empty dictionary.
+        Returns:
+            ActivityEvent: The activity event.
+        """
 class CodeEvent(Event):
-    """Event schema for model-triggered code execution.
+    """Event schema for model-generated code to be executed.
     Attributes:
-        id (str): The unique identifier for the code event. Defaults to an empty string.
-        type (Literal): The type of event (code, code_start, or code_end).
-        value (str): The code content.
-        level (EventLevel): The severity level of the event. Defined through the EventLevel constants.
+        id (str): The ID of the code event. Defaults to None.
+        value (str): The value of the code event. Defaults to an empty string.
+        level (EventLevel): The severity level of the code event. Defaults to EventLevel.INFO.
+        type (CodeEventType): The type of the code event. Defaults to LMEventType.CODE.
+        timestamp (datetime): The timestamp of the code event. Defaults to the current timestamp.
+        metadata (dict[str, Any]): The metadata of the code event. Defaults to an empty dictionary.
     """
-    id: str
-    type: Literal[EmitDataType.CODE, EmitDataType.CODE_START, EmitDataType.CODE_END]
     value: str
-    level: EventLevel
+    type: CodeEventType
     @classmethod
-    def start(cls, id_: str | None = '') -> CodeEvent:
+    def start(cls, id_: str | None = None) -> CodeEvent:
         """Create a code start event.
         Args:
-            id_ (str | None): The unique identifier for the code event. Defaults to an empty string.
+            id_ (str | None, optional): The ID of the code event. Defaults to None.
         Returns:
             CodeEvent: The code start event.
         """
     @classmethod
-    def content(cls, id_: str | None = '', value: str = '') -> CodeEvent:
+    def content(cls, id_: str | None = None, value: str = '') -> CodeEvent:
         """Create a code content event.
         Args:
-            id_ (str | None): The unique identifier for the code event. Defaults to an empty string.
-            value (str): The code content.
+            id_ (str | None, optional): The ID of the code event. Defaults to None.
+            value (str, optional): The code content. Defaults to an empty string.
         Returns:
             CodeEvent: The code value event.
         """
     @classmethod
-    def end(cls, id_: str | None = '') -> CodeEvent:
+    def end(cls, id_: str | None = None) -> CodeEvent:
         """Create a code end event.
         Args:
-            id_ (str | None): The unique identifier for the code event. Defaults to an empty string.
+            id_ (str | None, optional): The ID of the code event. Defaults to None.
         Returns:
             CodeEvent: The code end event.
         """
 class ThinkingEvent(Event):
-    """Event schema for model thinking.
+    """Event schema for model-generated thinking.
     Attributes:
-        id (str): The unique identifier for the thinking event. Defaults to an empty string.
-        type (Literal): The type of thinking event (thinking, thinking_start, or thinking_end).
-        value (str): The thinking content or message.
-        level (EventLevel): The severity level of the event. Defined through the EventLevel constants.
+        id (str): The ID of the thinking event. Defaults to None.
+        value (str): The value of the thinking event. Defaults to an empty string.
+        level (EventLevel): The severity level of the thinking event. Defaults to EventLevel.INFO.
+        type (ThinkingEventType): The type of the thinking event. Defaults to LMEventType.THINKING.
+        timestamp (datetime): The timestamp of the thinking event. Defaults to the current timestamp.
+        metadata (dict[str, Any]): The metadata of the thinking event. Defaults to an empty dictionary.
     """
-    id: str
-    type: Literal[EmitDataType.THINKING, EmitDataType.THINKING_START, EmitDataType.THINKING_END]
     value: str
-    level: EventLevel
+    type: ThinkingEventType
     @classmethod
-    def start(cls, id_: str | None = '') -> ThinkingEvent:
+    def start(cls, id_: str | None = None) -> ThinkingEvent:
         """Create a thinking start event.
         Args:
-            id_ (str | None): The unique identifier for the thinking event. Defaults to an empty string.
+            id_ (str | None, optional): The ID of the thinking event. Defaults to None.
         Returns:
             ThinkingEvent: The thinking start event.
         """
     @classmethod
-    def content(cls, id_: str | None = '', value: str = '') -> ThinkingEvent:
+    def content(cls, id_: str | None = None, value: str = '') -> ThinkingEvent:
         """Create a thinking value event.
         Args:
-            id_ (str | None): The unique identifier for the thinking event. Defaults to an empty string.
-            value (str): The thinking content or message.
+            id_ (str | None, optional): The ID of the thinking event. Defaults to None.
+            value (str, optional): The thinking content or message. Defaults to an empty string.
         Returns:
             ThinkingEvent: The thinking value event.
         """
     @classmethod
-    def end(cls, id_: str | None = '') -> ThinkingEvent:
+    def end(cls, id_: str | None = None) -> ThinkingEvent:
         """Create a thinking end event.
         Args:
-            id_ (str | None): The unique identifier for the thinking event. Defaults to an empty string.
+            id_ (str | None, optional): The ID of the thinking event. Defaults to None.
         Returns:
             ThinkingEvent: The thinking end event.

gllm_inference/schema/model_id.pyi CHANGED Viewed

@@ -12,8 +12,10 @@ class ModelProvider(StrEnum):
     ANTHROPIC = 'anthropic'
     AZURE_OPENAI = 'azure-openai'
     BEDROCK = 'bedrock'
+    COHERE = 'cohere'
     DATASAUR = 'datasaur'
     GOOGLE = 'google'
+    JINA = 'jina'
     LANGCHAIN = 'langchain'
     LITELLM = 'litellm'
     OPENAI = 'openai'
@@ -45,6 +47,11 @@ class ModelId(BaseModel):
         model_id = ModelId.from_string("bedrock/us.anthropic.claude-sonnet-4-20250514-v1:0")
         ```
+        # Using Cohere
+        ```python
+        model_id = ModelId.from_string("cohere/embed-english-v3.0")
+        ```
         # Using Datasaur
         ```python
         model_id = ModelId.from_string("datasaur/https://deployment.datasaur.ai/api/deployment/teamId/deploymentId/")
@@ -55,6 +62,13 @@ class ModelId(BaseModel):
         model_id = ModelId.from_string("google/gemini-2.5-flash-lite")
         ```
+        # Using Jina
+        ```python
+        model_id = ModelId.from_string("jina/jina-embeddings-v2-large")
+        ```
+        For the list of supported models, please refer to the following page:
+        https://jina.ai/models
         # Using OpenAI
         ```python
         model_id = ModelId.from_string("openai/gpt-5-nano")
@@ -94,6 +108,7 @@ class ModelId(BaseModel):
         ```python
         model_id = ModelId.from_string("langchain/langchain_openai.ChatOpenAI:gpt-4o-mini")
         ```
         For the list of supported providers, please refer to the following table:
         https://python.langchain.com/docs/integrations/chat/#featured-providers

gllm_inference.cpython-311-darwin.so CHANGED Viewed

Binary file

gllm_inference.pyi CHANGED Viewed

@@ -14,7 +14,9 @@ import gllm_core
 import gllm_core.utils
 import gllm_inference.em_invoker.AzureOpenAIEMInvoker
 import gllm_inference.em_invoker.BedrockEMInvoker
+import gllm_inference.em_invoker.CohereEMInvoker
 import gllm_inference.em_invoker.GoogleEMInvoker
+import gllm_inference.em_invoker.JinaEMInvoker
 import gllm_inference.em_invoker.LangChainEMInvoker
 import gllm_inference.em_invoker.OpenAICompatibleEMInvoker
 import gllm_inference.em_invoker.OpenAIEMInvoker
@@ -50,16 +52,21 @@ import gllm_inference.exceptions.BaseInvokerError
 import gllm_inference.exceptions.convert_http_status_to_base_invoker_error
 import gllm_inference.schema.Vector
 import aioboto3
-import asyncio.CancelledError
-import gllm_inference.exceptions.convert_to_base_invoker_error
+import base64
 import gllm_inference.schema.Attachment
 import gllm_inference.schema.AttachmentType
 import gllm_inference.schema.EMContent
+import gllm_inference.utils.validate_string_enum
+import cohere
+import asyncio.CancelledError
+import gllm_inference.exceptions.convert_to_base_invoker_error
 import gllm_inference.schema.TruncateSide
 import google
 import google.auth
 import google.genai
 import google.genai.types
+import httpx
+import gllm_inference.exceptions.ProviderInternalError
 import concurrent
 import concurrent.futures
 import concurrent.futures.ThreadPoolExecutor
@@ -71,9 +78,7 @@ import gllm_inference.utils.load_langchain_model
 import gllm_inference.utils.parse_model_data
 import openai
 import io
-import httpx
 import twelvelabs
-import base64
 import sys
 import voyageai
 import voyageai.client_async
@@ -109,9 +114,8 @@ import inspect
 import time
 import jsonschema
 import gllm_inference.lm_invoker.batch.BatchOperations
-import gllm_inference.schema.Activity
+import gllm_inference.schema.LMEventType
 import gllm_inference.schema.MessageContent
-import gllm_inference.utils.validate_string_enum
 import __future__
 import gllm_inference.schema.ActivityEvent
 import gllm_inference.schema.CodeEvent

{gllm_inference_binary-0.5.41.dist-info → gllm_inference_binary-0.5.44.dist-info}/METADATA RENAMED Viewed

@@ -1,12 +1,12 @@
 Metadata-Version: 2.2
 Name: gllm-inference-binary
-Version: 0.5.41
+Version: 0.5.44
 Summary: A library containing components related to model inferences in Gen AI applications.
 Author-email: Henry Wicaksono <henry.wicaksono@gdplabs.id>, Resti Febrina <resti.febrina@gdplabs.id>
 Requires-Python: <3.14,>=3.11
 Description-Content-Type: text/markdown
 Requires-Dist: poetry<3.0.0,>=2.1.3
-Requires-Dist: gllm-core-binary<0.4.0,>=0.3.0
+Requires-Dist: gllm-core-binary<0.4.0,>=0.3.21
 Requires-Dist: aiohttp<4.0.0,>=3.12.14
 Requires-Dist: filetype<2.0.0,>=1.2.0
 Requires-Dist: httpx<0.29.0,>=0.28.0
@@ -30,6 +30,8 @@ Provides-Extra: anthropic
 Requires-Dist: anthropic<0.61.0,>=0.60.0; extra == "anthropic"
 Provides-Extra: bedrock
 Requires-Dist: aioboto3<16.0.0,>=15.0.0; extra == "bedrock"
+Provides-Extra: cohere
+Requires-Dist: cohere<6.0.0,>=5.18.0; extra == "cohere"
 Provides-Extra: datasaur
 Requires-Dist: openai<2.0.0,>=1.98.0; extra == "datasaur"
 Provides-Extra: google

{gllm_inference_binary-0.5.41.dist-info → gllm_inference_binary-0.5.44.dist-info}/RECORD RENAMED Viewed

@@ -1,9 +1,9 @@
-gllm_inference.cpython-311-darwin.so,sha256=VoV4hiBQlVi8zii2NE_MiJIw2GxFehwQXlKJQnLzP1g,5129744
-gllm_inference.pyi,sha256=d5iZJ3btcsBjjKRCWz639Tu8HMMIpYliPmJCNCputQY,4730
+gllm_inference.cpython-311-darwin.so,sha256=nhIC8jkaabVyzvYoCVRoT4CErxh5p7z0UVojf4-kEUM,5313240
+gllm_inference.pyi,sha256=Ue4h4rmHxeDhBKu4Ofd6wTgDBxxsFhd_CxTCvtQgZpA,4898
 gllm_inference/__init__.pyi,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-gllm_inference/constants.pyi,sha256=uCf0Rc8GkKwUKeMC5wx5WG_x0iV_piKhjZQl1gNffSQ,291
+gllm_inference/constants.pyi,sha256=viU-ACRbVSGvsCJ0FQmuR1yhyl-BzoHDVIWo5cwHmF0,337
 gllm_inference/builder/__init__.pyi,sha256=usz2lvfwO4Yk-ZGKXbCWG1cEr3nlQXxMNDNC-2yc1NM,500
-gllm_inference/builder/build_em_invoker.pyi,sha256=Qn8nD0XpzbZgps5FcnLIyubKlrWhHJyhy6jU-68u9oc,5628
+gllm_inference/builder/build_em_invoker.pyi,sha256=YunCB3g7gRSYVDRayjz38QCw77_el2e-0iqdOH6KS1Y,6138
 gllm_inference/builder/build_lm_invoker.pyi,sha256=3hiIurQ3TC7kEZPflJ6_byCNnEdcd5BEIz07ii4TAzY,7292
 gllm_inference/builder/build_lm_request_processor.pyi,sha256=KbQkcPa8C-yzyelht4mWLP8kDmh17itAT3tn8ZJB6pg,4144
 gllm_inference/builder/build_output_parser.pyi,sha256=_Lrq-bh1oPsb_Nwkkr_zyEUwIOMysRFZkvEtEM29LZM,936
@@ -11,11 +11,13 @@ gllm_inference/catalog/__init__.pyi,sha256=JBkPGTyiiZ30GECzJBW-mW8LekWyY2qyzal3e
 gllm_inference/catalog/catalog.pyi,sha256=a4RNG1lKv51GxQpOqh47tz-PAROMPaeP2o5XNLBSZaU,4790
 gllm_inference/catalog/lm_request_processor_catalog.pyi,sha256=WW1j8jWujnatF0c9rCk94CyobtFe3gOky2vjoGCV6nw,5424
 gllm_inference/catalog/prompt_builder_catalog.pyi,sha256=OU8k_4HbqjZEzHZlzSM3uzGQZJmM2uGD76Csqom0CEQ,3197
-gllm_inference/em_invoker/__init__.pyi,sha256=83QVCkMjS2-jMKdAvmZska4LuJ-un755lAxjuVSLZ9o,987
+gllm_inference/em_invoker/__init__.pyi,sha256=FHFR4k8RqtdMNZkda6A89tvWFtIoxF-t_NahDGeBQ2k,1199
 gllm_inference/em_invoker/azure_openai_em_invoker.pyi,sha256=fE-RZ10Leerbyqp8ISXeqdU_m0kaHdlHml_nQqwFjqY,4961
 gllm_inference/em_invoker/bedrock_em_invoker.pyi,sha256=hbKdar6Alu27gOPPASND1ptJIK1PPmj7NjgKwItnOgo,5725
+gllm_inference/em_invoker/cohere_em_invoker.pyi,sha256=LSNVGx58JdSP2YB6CziOS_v5VuSLdARVpBBWhz8t5E4,6665
 gllm_inference/em_invoker/em_invoker.pyi,sha256=KGjLiAWGIA3ziV50zMwSzx6lTVUbYspQCl4LFxqbDlY,5101
 gllm_inference/em_invoker/google_em_invoker.pyi,sha256=OgIQhT2g6g09Hqr9mc2--MjV3Ti-XuHfqLTunvcqU1k,6824
+gllm_inference/em_invoker/jina_em_invoker.pyi,sha256=WZJ8BeaqxrAGMrUtIEUy3itcOEzvRQYEwe0gazIv6ng,5651
 gllm_inference/em_invoker/langchain_em_invoker.pyi,sha256=BhZjkYZoxQXPJjP0PgA8W0xrtwiqDkW5E6NpGit0h1E,3498
 gllm_inference/em_invoker/openai_compatible_em_invoker.pyi,sha256=z4_jEuaprna6AJF2wXH-JgmynpVFXeb2HQZr-0ATmMw,2882
 gllm_inference/em_invoker/openai_em_invoker.pyi,sha256=tb6cXTvAGr01MMSc96mYWDqK-EK_VCdDOQ-Be0_EZfM,6195
@@ -25,7 +27,9 @@ gllm_inference/em_invoker/langchain/__init__.pyi,sha256=VYGKE5OgU0my1RlhgzkU_A7-
 gllm_inference/em_invoker/langchain/em_invoker_embeddings.pyi,sha256=VU3-Vhb9BCDhJo8PPdWHe2rBEOCs_HMXT6ZaWwjUzZE,3304
 gllm_inference/em_invoker/schema/__init__.pyi,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 gllm_inference/em_invoker/schema/bedrock.pyi,sha256=AHFW8uYOTS7RtqV1RmtY-XQK1xpMgsHxWg4RZhVgI_8,476
+gllm_inference/em_invoker/schema/cohere.pyi,sha256=UTbTtePRR1zJMsM09SiTZSZZP0IaUGaODvc7ZqH9S8c,547
 gllm_inference/em_invoker/schema/google.pyi,sha256=ovDlvinu99QJhIxMkvVUoGBEFkkEoAZhadSuk0nI9N8,181
+gllm_inference/em_invoker/schema/jina.pyi,sha256=hD7ZJeoZzg-2bhYIjxCAi7dbavbA785ezRDay7cZy7o,711
 gllm_inference/em_invoker/schema/langchain.pyi,sha256=edcUvc1IHoSMFwqV83uqWqd0U3fLhkyWQjVknvjHI8U,112
 gllm_inference/em_invoker/schema/openai.pyi,sha256=Q_dsEcodkOXYXPdrkOkW0LnuLhfeq8tEbtZAGMz2ajA,139
 gllm_inference/em_invoker/schema/openai_compatible.pyi,sha256=gmvGtsWoOMBelke_tZjC6dKimFBW9f4Vrgv0Ig0OM9Q,150
@@ -34,7 +38,7 @@ gllm_inference/em_invoker/schema/voyage.pyi,sha256=HVpor0fqNy-IwapCICfsgFmqf1FJX
 gllm_inference/exceptions/__init__.pyi,sha256=Upcuj7od2lkbdueQ0iMT2ktFYYi-KKTynTLAaxWDTjU,1214
 gllm_inference/exceptions/error_parser.pyi,sha256=IOfa--NpLUW5E9Qq0mwWi6ZpTAbUyyNe6iAqunBNGLI,1999
 gllm_inference/exceptions/exceptions.pyi,sha256=Bv996qLa_vju0Qjf4GewMxdkq8CV9LRZb0S6289DldA,5725
-gllm_inference/exceptions/provider_error_map.pyi,sha256=P1WnhWkM103FW6hqMfNZBOmYSWOmsJtll3VQV8DGb8E,1210
+gllm_inference/exceptions/provider_error_map.pyi,sha256=XPLWU42-r8MHZgg5ZkE80Gdqg3p8Z_JHvq_Na03iTqY,1243
 gllm_inference/lm_invoker/__init__.pyi,sha256=IGF3h8Z7Yr0bLrkDMRTDVPNBU6Y3liJabW3acjstJDY,1374
 gllm_inference/lm_invoker/anthropic_lm_invoker.pyi,sha256=tsO9WJRj7l4auLc2vxftMX-niWJ9dlYwUIeiTL2FtIo,16392
 gllm_inference/lm_invoker/azure_openai_lm_invoker.pyi,sha256=6aqQdwVNLO9bDNrqcO8s75IJAN2hLSGvhO6VeDyz44w,14347
@@ -43,7 +47,7 @@ gllm_inference/lm_invoker/datasaur_lm_invoker.pyi,sha256=6DTnHsCFtGkwqVIlvmIZqKQ
 gllm_inference/lm_invoker/google_lm_invoker.pyi,sha256=vbnh9PxtEtK740QEgqk6a7sBmtuvOPQ5_1Z3UDSonR4,17338
 gllm_inference/lm_invoker/langchain_lm_invoker.pyi,sha256=NViXl_eGfFGVwLKjJ5OFdV78oay85YLgBZ8QVJGbaLA,12491
 gllm_inference/lm_invoker/litellm_lm_invoker.pyi,sha256=FHAxghha7Jfjjnty0gwgmcWRdEke_tr-54PkKc9BRUU,12404
-gllm_inference/lm_invoker/lm_invoker.pyi,sha256=e09lZeJmWA9s7pjOoogDK5mOdmMB9N8m-5_f1BqLpTE,8495
+gllm_inference/lm_invoker/lm_invoker.pyi,sha256=YfwlV5uJwwoC0uJ54qsF2PZ5eoX85kUWV14nEiBvXTM,8501
 gllm_inference/lm_invoker/openai_chat_completions_lm_invoker.pyi,sha256=zdHK-YmfplLmvwi1VASm2zvqqyLMoVSMHh2ggqaHIDA,14905
 gllm_inference/lm_invoker/openai_compatible_lm_invoker.pyi,sha256=i5pMpZf4-r_7FQ1qfsqcjpc98sI-cPiqheuTfTEKxJs,4192
 gllm_inference/lm_invoker/openai_lm_invoker.pyi,sha256=YplNfGRnLAv9puh_9hhCiQ3HbVD3XIZAkyvBR06qCpg,23019
@@ -95,18 +99,18 @@ gllm_inference/realtime_chat/output_streamer/output_streamer.pyi,sha256=GPAw1wPS
 gllm_inference/request_processor/__init__.pyi,sha256=hVnfdNZnkTBJHnmLtN3Na4ANP0yK6AstWdIizVr2Apo,227
 gllm_inference/request_processor/lm_request_processor.pyi,sha256=VnYc8E3Iayyhw-rPnGPfTKuO3ohgFsS8HPrZJeyES5I,5889
 gllm_inference/request_processor/uses_lm_mixin.pyi,sha256=Yu0XPNuHxq1tWBviHTPw1oThojneFwGHepvGjBXxKQA,6382
-gllm_inference/schema/__init__.pyi,sha256=bV9_1E-3ce6Dm6Q7xJ6TynPmxQAE1-ujfp9fkRbjI0E,2116
-gllm_inference/schema/activity.pyi,sha256=xGZbfceV8iTJcLtRJrwHfK-dYdhQRmhNwWm7KuckLh4,1974
+gllm_inference/schema/__init__.pyi,sha256=CSyh7FmQWkIasNderPd5xDptlu-CliGSzXbDV7j4KyA,2159
+gllm_inference/schema/activity.pyi,sha256=JnO2hqj91P5Tc6qb4pbkEMrHer2u5owiCvhl-igcQKQ,2303
 gllm_inference/schema/attachment.pyi,sha256=jApuzjOHJDCz4lr4MlHzBgIndh559nbWu2Xp1fk3hso,3297
 gllm_inference/schema/code_exec_result.pyi,sha256=ZTHh6JtRrPIdQ059P1UAiD2L-tAO1_S5YcMsAXfJ5A0,559
 gllm_inference/schema/config.pyi,sha256=rAL_UeXyQeXVk1P2kqd8vFWOMwmKenfpQLtvMP74t9s,674
-gllm_inference/schema/enums.pyi,sha256=5shfuJs76BqiAIZpA1wW1gXe5_KuFikQvuW3ALbQAmM,1322
-gllm_inference/schema/events.pyi,sha256=jnOrZhACkbpTCQVr_DCZfCQSuUvfuqonKDbknbwiQYw,3920
+gllm_inference/schema/enums.pyi,sha256=RkHW2GQisgHBvYQ928D6olpL6GYehv65g8uoiGVsWUM,1612
+gllm_inference/schema/events.pyi,sha256=3dJtYRuofgFDW1-kqV7PQw0WVyraEYC9je8196K-Cf8,4934
 gllm_inference/schema/lm_input.pyi,sha256=A5pjz1id6tP9XRNhzQrbmzd66C_q3gzo0UP8rCemz6Q,193
 gllm_inference/schema/lm_output.pyi,sha256=1SZi6vIWvmrZlVQ59WeQUKO5VhKrLHsSRDYslEH9d7o,2435
 gllm_inference/schema/mcp.pyi,sha256=Vwu8E2BDl6FvvnI42gIyY3Oki1BdwRE3Uh3aV0rmhQU,1014
 gllm_inference/schema/message.pyi,sha256=VP9YppKj2mo1esl9cy6qQO9m2mMHUjTmfGDdyUor880,2220
-gllm_inference/schema/model_id.pyi,sha256=y61SGPXHvQDGA9krg29pX58EE8HwLrb6XEKNo1ZNGVE,5256
+gllm_inference/schema/model_id.pyi,sha256=L2bbG6p3HyKn1naecgc8SNGBaqeH8i9CcUDgd-whP-A,5652
 gllm_inference/schema/reasoning.pyi,sha256=SlTuiDw87GdnAn-I6YOPIJRhEBiwQljM46JohG05guQ,562
 gllm_inference/schema/token_usage.pyi,sha256=1GTQVORV0dBNmD_jix8aVaUqxMKFF04KpLP7y2urqbk,2950
 gllm_inference/schema/tool_call.pyi,sha256=zQaVxCnkVxOfOEhBidqohU85gb4PRwnwBiygKaunamk,389
@@ -117,7 +121,7 @@ gllm_inference/utils/io_utils.pyi,sha256=7kUTacHAVRYoemFUOjCH7-Qmw-YsQGd6rGYxjf_
 gllm_inference/utils/langchain.pyi,sha256=VluQiHkGigDdqLUbhB6vnXiISCP5hHqV0qokYY6dC1A,1164
 gllm_inference/utils/validation.pyi,sha256=toxBtRp-VItC_X7sNi-GDd7sjibBdWMrR0q01OI2D7k,385
 gllm_inference.build/.gitignore,sha256=aEiIwOuxfzdCmLZe4oB1JsBmCUxwG8x-u-HBCV9JT8E,1
-gllm_inference_binary-0.5.41.dist-info/METADATA,sha256=N0d9DU2qIs39yjq-7Pu5V4gPVCoAR6wCS1gWMhNAK8M,5636
-gllm_inference_binary-0.5.41.dist-info/WHEEL,sha256=s8TBzVnsSJujxqbMe-G5Vh0IPlslLTnVva4BiQ75Hjo,105
-gllm_inference_binary-0.5.41.dist-info/top_level.txt,sha256=FpOjtN80F-qVNgbScXSEyqa0w09FYn6301iq6qt69IQ,15
-gllm_inference_binary-0.5.41.dist-info/RECORD,,
+gllm_inference_binary-0.5.44.dist-info/METADATA,sha256=ioEKrM2Qov6BNbvcQnR_WCkCwW8jeN4KuZNfXCjZbw4,5716
+gllm_inference_binary-0.5.44.dist-info/WHEEL,sha256=s8TBzVnsSJujxqbMe-G5Vh0IPlslLTnVva4BiQ75Hjo,105
+gllm_inference_binary-0.5.44.dist-info/top_level.txt,sha256=FpOjtN80F-qVNgbScXSEyqa0w09FYn6301iq6qt69IQ,15
+gllm_inference_binary-0.5.44.dist-info/RECORD,,

{gllm_inference_binary-0.5.41.dist-info → gllm_inference_binary-0.5.44.dist-info}/WHEEL RENAMED Viewed

File without changes

{gllm_inference_binary-0.5.41.dist-info → gllm_inference_binary-0.5.44.dist-info}/top_level.txt RENAMED Viewed

File without changes