PyPI - gllm-inference-binary - Versions diffs - 0.5.5__cp313-cp313-manylinux_2_31_x86_64.whl → 0.5.7__cp313-cp313-manylinux_2_31_x86_64.whl - Mend

gllm-inference-binary 0.5.5__cp313-cp313-manylinux_2_31_x86_64.whl → 0.5.7__cp313-cp313-manylinux_2_31_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

gllm_inference/builder/build_lm_request_processor.pyi CHANGED Viewed

@@ -8,7 +8,7 @@ from typing import Any
 logger: Incomplete
-def build_lm_request_processor(model_id: str | ModelId, credentials: str | dict[str, Any] | None = None, config: dict[str, Any] | None = None, system_template: str = '', user_template: str = '', output_parser_type: str = 'none') -> LMRequestProcessor:
+def build_lm_request_processor(model_id: str | ModelId, credentials: str | dict[str, Any] | None = None, config: dict[str, Any] | None = None, system_template: str = '', user_template: str = '', key_defaults: dict[str, Any] | None = None, output_parser_type: str = 'none') -> LMRequestProcessor:
     '''Build a language model request processor based on the provided configurations.
     Args:
@@ -29,6 +29,9 @@ def build_lm_request_processor(model_id: str | ModelId, credentials: str | dict[
             Defaults to an empty string.
         user_template (str): The user prompt template. May contain placeholders enclosed in curly braces `{}`.
             Defaults to an empty string.
+        key_defaults (dict[str, Any] | None, optional): Default values for the keys in the prompt templates.
+            Applied when the corresponding keys are not provided in the runtime input.
+            Defaults to None, in which case no default values will be assigned to the keys.
         output_parser_type (str, optional): The type of output parser to use. Supports "json" and "none".
             Defaults to "none".
@@ -63,13 +66,14 @@ def build_lm_request_processor(model_id: str | ModelId, credentials: str | dict[
         )
         ```
-        # With system template
+        # With custom prompt builder configuration
         ```python
         lm_request_processor = build_lm_request_processor(
             model_id="openai/gpt-4o-mini",
             credentials="sk-...",
-            system_template="Talk like a pirate.",
+            system_template="Talk like a {role}.",
             user_template="{query}",
+            key_defaults={"role": "pirate"},
         )
         ```

gllm_inference/catalog/lm_request_processor_catalog.pyi CHANGED Viewed

@@ -6,6 +6,7 @@ from gllm_inference.request_processor import LMRequestProcessor as LMRequestProc
 MODEL_ID_ENV_VAR_REGEX_PATTERN: str
 LM_REQUEST_PROCESSOR_REQUIRED_COLUMNS: Incomplete
 CONFIG_SCHEMA_MAP: Incomplete
+logger: Incomplete
 class LMRequestProcessorCatalog(BaseCatalog[LMRequestProcessor]):
     '''Loads multiple LM request processors from certain sources.
@@ -46,17 +47,24 @@ class LMRequestProcessorCatalog(BaseCatalog[LMRequestProcessor]):
         # Example 4: Load from record
         ```python
-        catalog = LMRequestProcessorCatalog.from_records(
-            name="...",
-            system_template="...",
-            user_template="...",
-            model_id="...",
-            credentials="...",
-            config="...",
-            output_parser_type="...",
-        )
-        lm_request_processor = catalog.name
+        records=[
+            {
+                "name": "answer_question",
+                "system_template": (
+                    "You are a helpful assistant.\\n"
+                    "Answer the following question based on the provided context.\\n"
+                    "```{context}```"
+                ),
+                "user_template": "{query}",
+                "key_defaults": \'{"context": "<default context>"}\',
+                "model_id": "openai/gpt-4.1-nano",
+                "credentials": "OPENAI_API_KEY",
+                "config": "",
+                "output_parser_type": "none",
+            },
+        ]
+        catalog = LMRequestProcessorCatalog.from_records(records=records)
+        lm_request_processor = catalog.answer_question
         ```
     Template Format Example:
@@ -66,35 +74,39 @@ class LMRequestProcessorCatalog(BaseCatalog[LMRequestProcessor]):
         # Example 2: CSV
         For an example of how a CSV file can be formatted to be loaded using LMRequestProcessorCatalog, see:
-        https://drive.google.com/file/d/10nYKn_r9SVnTkaik-caMqUjX6prUZ62M/view?usp=drive_link
+        https://drive.google.com/file/d/1_2rSoxh3CR2KZxIyUmpowMrt0Lm0YqAb/view?usp=drive_link
     Template Explanation:
         The required columns are:
-            1. name (str): The name of the LM request processor.
-            2. system_template (str): The system template of the prompt builder.
-            3. user_template (str): The user template of the prompt builder.
-            4. model_id (str): The model ID of the LM invoker.
-            5. credentials (str | json_str): The credentials of the LM invoker.
-            6. config (json_str): The additional configuration of the LM invoker.
-            7. output_parser_type (str): The type of the output parser.
+        1. name (str): The name of the LM request processor.
+        2. system_template (str): The system template of the prompt builder.
+        3. user_template (str): The user template of the prompt builder.
+        4. key_defaults (json_str): The default values for the prompt template keys.
+        5. model_id (str): The model ID of the LM invoker.
+        6. credentials (str | json_str): The credentials of the LM invoker.
+        7. config (json_str): The additional configuration of the LM invoker.
+        8. output_parser_type (str): The type of the output parser.
         Important Notes:
         1. At least one of `system_template` or `user_template` must be filled.
-        2. The `model_id`:
-            2.1. Must be filled with the model ID of the LM invoker, e.g. "openai/gpt-4.1-nano".
-            2.2. Can be partially loaded from the environment variable using the "${ENV_VAR_KEY}" syntax,
+        2. `key_defaults` is optional. If filled, must be a dictionary containing the default values for the
+            prompt template keys. These default values will be applied when the corresponding keys are not provided
+            in the runtime input. If it is empty, the prompt template keys will not have default values.
+        3. The `model_id`:
+            3.1. Must be filled with the model ID of the LM invoker, e.g. "openai/gpt-4.1-nano".
+            3.2. Can be partially loaded from the environment variable using the "${ENV_VAR_KEY}" syntax,
                 e.g. "azure-openai/${AZURE_ENDPOINT}/${AZURE_DEPLOYMENT}".
-            2.3. For the available model ID formats, see: https://gdplabs.gitbook.io/sdk/resources/supported-models
-        3. `credentials` is optional. If it is filled, it can either be:
-            3.1. An environment variable name containing the API key (e.g. OPENAI_API_KEY).
-            3.2. An environment variable name containing the path to a credentials JSON file
+            3.3. For the available model ID formats, see: https://gdplabs.gitbook.io/sdk/resources/supported-models
+        4. `credentials` is optional. If it is filled, it can either be:
+            4.1. An environment variable name containing the API key (e.g. OPENAI_API_KEY).
+            4.2. An environment variable name containing the path to a credentials JSON file
                 (e.g. GOOGLE_CREDENTIALS_FILE_PATH). Currently only supported for Google Vertex AI.
-            3.3. A dictionary of credentials, with each value being an environment variable name corresponding to the
+            4.3. A dictionary of credentials, with each value being an environment variable name corresponding to the
                 credential (e.g. {"api_key": "OPENAI_API_KEY"}). Currently supported for Bedrock and LangChain.
             If it is empty, the LM invoker will use the default credentials loaded from the environment variables.
-        4. `config` is optional. If filled, must be a dictionary containing the configuration for the LM invoker.
+        5. `config` is optional. If filled, must be a dictionary containing the configuration for the LM invoker.
             If it is empty, the LM invoker will use the default configuration.
-        5. `output_parser_type` can either be:
-            5.1. none: No output parser will be used.
-            5.2. json: The JSONOutputParser will be used.
+        6. `output_parser_type` can either be:
+            6.1. none: No output parser will be used.
+            6.2. json: The JSONOutputParser will be used.
     '''

gllm_inference/catalog/prompt_builder_catalog.pyi CHANGED Viewed

@@ -3,6 +3,7 @@ from gllm_inference.catalog.catalog import BaseCatalog as BaseCatalog
 from gllm_inference.prompt_builder.prompt_builder import PromptBuilder as PromptBuilder
 PROMPT_BUILDER_REQUIRED_COLUMNS: Incomplete
+logger: Incomplete
 class PromptBuilderCatalog(BaseCatalog[PromptBuilder]):
     '''Loads multiple prompt builders from certain sources.
@@ -42,22 +43,14 @@ class PromptBuilderCatalog(BaseCatalog[PromptBuilder]):
         ```python
         records=[
             {
-                "name": "summarize",
-                "system": "You are an AI expert\\nSummarize the following context.\\n\\nContext:\\n```{context}```",
-                "user": ""
-            },
-            {
-                "name": "transform_query",
-                "system": "",
-                "user": "Transform the following query into a simpler form.\\n\\nQuery:\\n```{query}```"
-            },
-            {
-                "name": "draft_document",
+                "name": "answer_question",
                 "system": (
-                    "You are an AI expert.\\nDraft a document following the provided format and context.\\n\\n"
-                    "Format:\\n```{format}```\\n\\nContext:\\n```{context}```"
+                    "You are a helpful assistant.\\n"
+                    "Answer the following question based on the provided context.\\n"
+                    "```{context}```"
                 ),
-                "user": "User instruction:\\n{query}"
+                "user": "{query}",
+                "key_defaults": \'{"context": "<default context>"}\',
             },
         ]
         catalog = PromptBuilderCatalog.from_records(records=records)
@@ -71,15 +64,19 @@ class PromptBuilderCatalog(BaseCatalog[PromptBuilder]):
         # Example 2: CSV
         For an example of how a CSV file can be formatted to be loaded using PromptBuilderCatalog, see:
-        https://drive.google.com/file/d/1CWijOk-g16ZglUn_K2bDPmbyyBDK2r0L/view?usp=drive_link
+        https://drive.google.com/file/d/1KQgddMdbcZBZmroQFtjSl-TKLohq84Fz/view?usp=drive_link
     Template explanation:
         The required columns are:
-            1. name (str): The name of the prompt builder.
-            2. system (str): The system template of the prompt builder.
-            3. user (str): The user template of the prompt builder.
+        1. name (str): The name of the prompt builder.
+        2. system (str): The system template of the prompt builder.
+        3. user (str): The user template of the prompt builder.
+        4. key_defaults (json_str): The default values for the prompt template keys.
         Important Notes:
-            1. At least one of the `system` and `user` columns must be filled.
+        1. At least one of the `system` and `user` columns must be filled.
+        2. `key_defaults` is optional. If filled, must be a dictionary containing the default values for the
+            prompt template keys. These default values will be applied when the corresponding keys are not provided
+            in the runtime input. If it is empty, the prompt template keys will not have default values.
     '''

gllm_inference/constants.pyi CHANGED Viewed

@@ -3,6 +3,7 @@ from _typeshed import Incomplete
 DEFAULT_AZURE_OPENAI_API_VERSION: str
 DOCUMENT_MIME_TYPES: Incomplete
 GOOGLE_SCOPES: Incomplete
+INVOKER_PROPAGATED_MAX_RETRIES: int
 INVOKER_DEFAULT_TIMEOUT: float
 HEX_REPR_LENGTH: int
 HTTP_STATUS_CODE_PATTERNS: Incomplete

gllm_inference/em_invoker/azure_openai_em_invoker.pyi CHANGED Viewed

@@ -1,7 +1,8 @@
 from _typeshed import Incomplete
 from gllm_core.utils.retry import RetryConfig as RetryConfig
-from gllm_inference.constants import DEFAULT_AZURE_OPENAI_API_VERSION as DEFAULT_AZURE_OPENAI_API_VERSION
+from gllm_inference.constants import DEFAULT_AZURE_OPENAI_API_VERSION as DEFAULT_AZURE_OPENAI_API_VERSION, INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.em_invoker.openai_em_invoker import OpenAIEMInvoker as OpenAIEMInvoker
+from gllm_inference.em_invoker.schema.openai import Key as Key
 from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider
 from typing import Any

gllm_inference/em_invoker/google_em_invoker.pyi CHANGED Viewed

@@ -2,6 +2,7 @@ from _typeshed import Incomplete
 from gllm_core.utils.retry import RetryConfig as RetryConfig
 from gllm_inference.constants import GOOGLE_SCOPES as GOOGLE_SCOPES
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
+from gllm_inference.em_invoker.schema.google import Key as Key
 from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, Vector as Vector
 from typing import Any

gllm_inference/em_invoker/langchain_em_invoker.pyi CHANGED Viewed

@@ -1,6 +1,8 @@
 from _typeshed import Incomplete
-from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_core.utils.retry import RetryConfig
+from gllm_inference.constants import INVOKER_DEFAULT_TIMEOUT as INVOKER_DEFAULT_TIMEOUT, INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
+from gllm_inference.em_invoker.schema.langchain import Key as Key
 from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, Vector as Vector
 from gllm_inference.utils import load_langchain_model as load_langchain_model, parse_model_data as parse_model_data
 from langchain_core.embeddings import Embeddings as Embeddings

gllm_inference/em_invoker/openai_compatible_em_invoker.pyi CHANGED Viewed

@@ -1,6 +1,8 @@
 from _typeshed import Incomplete
 from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.em_invoker.openai_em_invoker import OpenAIEMInvoker as OpenAIEMInvoker
+from gllm_inference.em_invoker.schema.openai_compatible import Key as Key
 from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider
 from typing import Any

gllm_inference/em_invoker/openai_em_invoker.pyi CHANGED Viewed

@@ -1,6 +1,8 @@
 from _typeshed import Incomplete
 from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
+from gllm_inference.em_invoker.schema.openai import Key as Key
 from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, Vector as Vector
 from typing import Any

gllm_inference/em_invoker/schema/google.pyi ADDED Viewed

@@ -0,0 +1,7 @@
+class Key:
+    """Defines valid keys in Google."""
+    CREDENTIALS: str
+    HTTP_OPTIONS: str
+    LOCATION: str
+    PROJECT: str
+    TIMEOUT: str

gllm_inference/em_invoker/schema/langchain.pyi ADDED Viewed

@@ -0,0 +1,4 @@
+class Key:
+    """Defines valid keys in LangChain."""
+    MAX_RETRIES: str
+    TIMEOUT: str

gllm_inference/em_invoker/schema/openai.pyi ADDED Viewed

@@ -0,0 +1,7 @@
+class Key:
+    """Defines valid keys in OpenAI."""
+    API_KEY: str
+    BASE_URL: str
+    MAX_RETRIES: str
+    MODEL: str
+    TIMEOUT: str

gllm_inference/em_invoker/schema/openai_compatible.pyi ADDED Viewed

@@ -0,0 +1,7 @@
+class Key:
+    """Defines valid keys in OpenAI Compatible."""
+    API_KEY: str
+    BASE_URL: str
+    MAX_RETRIES: str
+    MODEL: str
+    TIMEOUT: str

gllm_inference/em_invoker/schema/twelvelabs.pyi CHANGED Viewed

@@ -1,7 +1,9 @@
 class Key:
     """Defines valid keys in TwelveLabs."""
     INPUT_KEY: str
+    MAX_RETRIES: str
     OUTPUT_KEY: str
+    TIMEOUT: str
     VALUE: str
 class InputType:

gllm_inference/em_invoker/schema/voyage.pyi CHANGED Viewed

@@ -1,8 +1,12 @@
 class Key:
     """Defines valid keys in Voyage."""
+    API_KEY: str
     CONTENT: str
     IMAGE_BASE64: str
+    MAX_RETRIES: str
+    MODEL: str
     TEXT: str
+    TIMEOUT: str
     TYPE: str
 class InputType:

gllm_inference/em_invoker/twelevelabs_em_invoker.pyi CHANGED Viewed

@@ -1,5 +1,6 @@
 from _typeshed import Incomplete
 from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
 from gllm_inference.em_invoker.schema.twelvelabs import InputType as InputType, Key as Key, OutputType as OutputType
 from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, ModelProvider as ModelProvider, Vector as Vector

gllm_inference/em_invoker/voyage_em_invoker.pyi CHANGED Viewed

@@ -1,5 +1,6 @@
 from _typeshed import Incomplete
 from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.em_invoker.em_invoker import BaseEMInvoker as BaseEMInvoker
 from gllm_inference.em_invoker.schema.voyage import InputType as InputType, Key as Key
 from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EMContent as EMContent, ModelId as ModelId, ModelProvider as ModelProvider, Vector as Vector

gllm_inference/lm_invoker/anthropic_lm_invoker.pyi CHANGED Viewed

@@ -1,6 +1,7 @@
 from _typeshed import Incomplete
 from gllm_core.event import EventEmitter as EventEmitter
 from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.lm_invoker.lm_invoker import BaseLMInvoker as BaseLMInvoker
 from gllm_inference.lm_invoker.schema.anthropic import InputType as InputType, Key as Key, OutputType as OutputType
 from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EmitDataType as EmitDataType, LMOutput as LMOutput, Message as Message, ModelId as ModelId, ModelProvider as ModelProvider, Reasoning as Reasoning, ResponseSchema as ResponseSchema, TokenUsage as TokenUsage, ToolCall as ToolCall, ToolResult as ToolResult

gllm_inference/lm_invoker/azure_openai_lm_invoker.pyi CHANGED Viewed

@@ -1,7 +1,8 @@
 from _typeshed import Incomplete
 from gllm_core.utils.retry import RetryConfig as RetryConfig
-from gllm_inference.constants import DEFAULT_AZURE_OPENAI_API_VERSION as DEFAULT_AZURE_OPENAI_API_VERSION
+from gllm_inference.constants import DEFAULT_AZURE_OPENAI_API_VERSION as DEFAULT_AZURE_OPENAI_API_VERSION, INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.lm_invoker.openai_lm_invoker import OpenAILMInvoker as OpenAILMInvoker, ReasoningEffort as ReasoningEffort, ReasoningSummary as ReasoningSummary
+from gllm_inference.lm_invoker.schema.openai import Key as Key
 from gllm_inference.schema import ModelId as ModelId, ModelProvider as ModelProvider, ResponseSchema as ResponseSchema
 from langchain_core.tools import Tool as Tool
 from typing import Any

gllm_inference/lm_invoker/datasaur_lm_invoker.pyi CHANGED Viewed

@@ -1,7 +1,7 @@
 from _typeshed import Incomplete
 from gllm_core.event import EventEmitter as EventEmitter
 from gllm_core.utils.retry import RetryConfig as RetryConfig
-from gllm_inference.constants import DOCUMENT_MIME_TYPES as DOCUMENT_MIME_TYPES
+from gllm_inference.constants import DOCUMENT_MIME_TYPES as DOCUMENT_MIME_TYPES, INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.lm_invoker.openai_compatible_lm_invoker import OpenAICompatibleLMInvoker as OpenAICompatibleLMInvoker
 from gllm_inference.lm_invoker.schema.datasaur import InputType as InputType, Key as Key
 from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, LMOutput as LMOutput, Message as Message, ModelId as ModelId, ModelProvider as ModelProvider, ResponseSchema as ResponseSchema, ToolCall as ToolCall, ToolResult as ToolResult

gllm_inference/lm_invoker/langchain_lm_invoker.pyi CHANGED Viewed

@@ -1,6 +1,7 @@
 from _typeshed import Incomplete
 from gllm_core.event import EventEmitter as EventEmitter
-from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_core.utils.retry import RetryConfig
+from gllm_inference.constants import INVOKER_DEFAULT_TIMEOUT as INVOKER_DEFAULT_TIMEOUT, INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.lm_invoker.lm_invoker import BaseLMInvoker as BaseLMInvoker
 from gllm_inference.lm_invoker.schema.langchain import InputType as InputType, Key as Key
 from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, LMOutput as LMOutput, Message as Message, MessageRole as MessageRole, ModelId as ModelId, ModelProvider as ModelProvider, ResponseSchema as ResponseSchema, TokenUsage as TokenUsage, ToolCall as ToolCall, ToolResult as ToolResult

gllm_inference/lm_invoker/openai_compatible_lm_invoker.pyi CHANGED Viewed

@@ -1,6 +1,7 @@
 from _typeshed import Incomplete
 from gllm_core.event import EventEmitter as EventEmitter
 from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.lm_invoker.lm_invoker import BaseLMInvoker as BaseLMInvoker
 from gllm_inference.lm_invoker.schema.openai_compatible import InputType as InputType, Key as Key, ReasoningEffort as ReasoningEffort
 from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, EmitDataType as EmitDataType, LMOutput as LMOutput, Message as Message, MessageRole as MessageRole, ModelId as ModelId, ModelProvider as ModelProvider, Reasoning as Reasoning, ResponseSchema as ResponseSchema, TokenUsage as TokenUsage, ToolCall as ToolCall, ToolResult as ToolResult

gllm_inference/lm_invoker/openai_lm_invoker.pyi CHANGED Viewed

@@ -1,6 +1,7 @@
 from _typeshed import Incomplete
 from gllm_core.event import EventEmitter as EventEmitter
 from gllm_core.utils.retry import RetryConfig as RetryConfig
+from gllm_inference.constants import INVOKER_PROPAGATED_MAX_RETRIES as INVOKER_PROPAGATED_MAX_RETRIES
 from gllm_inference.lm_invoker.lm_invoker import BaseLMInvoker as BaseLMInvoker
 from gllm_inference.lm_invoker.schema.openai import InputType as InputType, Key as Key, OutputType as OutputType, ReasoningEffort as ReasoningEffort, ReasoningSummary as ReasoningSummary
 from gllm_inference.schema import Attachment as Attachment, AttachmentType as AttachmentType, CodeExecResult as CodeExecResult, EmitDataType as EmitDataType, LMOutput as LMOutput, Message as Message, MessageRole as MessageRole, ModelId as ModelId, ModelProvider as ModelProvider, Reasoning as Reasoning, ResponseSchema as ResponseSchema, TokenUsage as TokenUsage, ToolCall as ToolCall, ToolResult as ToolResult

gllm_inference/lm_invoker/schema/anthropic.pyi CHANGED Viewed

@@ -8,6 +8,7 @@ class Key:
     ID: str
     INPUT: str
     INPUT_SCHEMA: str
+    MAX_RETRIES: str
     MEDIA_TYPE: str
     MAX_TOKENS: str
     NAME: str
@@ -17,6 +18,7 @@ class Key:
     SOURCE: str
     STOP_REASON: str
     SYSTEM: str
+    TIMEOUT: str
     THINKING: str
     TOOLS: str
     TOOL_CHOICE: str

gllm_inference/lm_invoker/schema/datasaur.pyi CHANGED Viewed

@@ -1,7 +1,9 @@
 class Key:
     """Defines valid keys in Datasaur."""
     CONTEXTS: str
+    MAX_RETRIES: str
     NAME: str
+    TIMEOUT: str
     TYPE: str
     URL: str

gllm_inference/lm_invoker/schema/google.pyi CHANGED Viewed

@@ -6,9 +6,12 @@ class Key:
     FINISH_REASON: str
     FUNCTION: str
     FUNCTION_CALL: str
+    HTTP_OPTIONS: str
     NAME: str
+    RETRY_OPTIONS: str
     SYSTEM_INSTRUCTION: str
     THINKING_CONFIG: str
+    TIMEOUT: str
     TOOLS: str
     RESPONSE_SCHEMA: str
     RESPONSE_MIME_TYPE: str

gllm_inference/lm_invoker/schema/langchain.pyi CHANGED Viewed

@@ -5,11 +5,13 @@ class Key:
     ID: str
     IMAGE_URL: str
     INPUT_TOKENS: str
+    MAX_RETRIES: str
     NAME: str
     OUTPUT_TOKENS: str
     PARSED: str
     RAW: str
     TEXT: str
+    TIMEOUT: str
     TYPE: str
     URL: str

gllm_inference/lm_invoker/schema/openai_compatible.pyi CHANGED Viewed

@@ -15,6 +15,7 @@ class Key:
     IMAGE_URL: str
     INPUT_AUDIO: str
     JSON_SCHEMA: str
+    MAX_RETRIES: str
     MESSAGE: str
     NAME: str
     RESPONSE_FORMAT: str
@@ -22,6 +23,7 @@ class Key:
     SCHEMA: str
     STRICT: str
     TEXT: str
+    TIMEOUT: str
     TITLE: str
     TOOLS: str
     TOOL_CALLS: str

gllm_inference.cpython-313-x86_64-linux-gnu.so CHANGED Viewed

Binary file

gllm_inference.pyi CHANGED Viewed

@@ -59,6 +59,7 @@ import langchain_core.embeddings
 import gllm_inference.utils.load_langchain_model
 import gllm_inference.utils.parse_model_data
 import io
+import httpx
 import twelvelabs
 import base64
 import sys
@@ -70,7 +71,6 @@ import enum
 import http
 import http.HTTPStatus
 import aiohttp
-import httpx
 import requests
 import gllm_inference.schema.ErrorResponse
 import gllm_core.constants

{gllm_inference_binary-0.5.5.dist-info → gllm_inference_binary-0.5.7.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: gllm-inference-binary
-Version: 0.5.5
+Version: 0.5.7
 Summary: A library containing components related to model inferences in Gen AI applications.
 Author: Henry Wicaksono
 Author-email: henry.wicaksono@gdplabs.id

{gllm_inference_binary-0.5.5.dist-info → gllm_inference_binary-0.5.7.dist-info}/RECORD RENAMED Viewed

@@ -2,49 +2,53 @@ gllm_inference/__init__.pyi,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 gllm_inference/builder/__init__.pyi,sha256=usz2lvfwO4Yk-ZGKXbCWG1cEr3nlQXxMNDNC-2yc1NM,500
 gllm_inference/builder/build_em_invoker.pyi,sha256=YL71GriZEXn4uxmXBJHWC200QdWRPwUJY_G0kKi5-dk,5352
 gllm_inference/builder/build_lm_invoker.pyi,sha256=aXdNU1gUBUz-4jZ-P791tlkmjOOInLYyeiveEJFlYZo,6468
-gllm_inference/builder/build_lm_request_processor.pyi,sha256=Mi0U3zga29FneTzzLeb_R0k4MM--LrNsl7xU4jd_12Y,4094
+gllm_inference/builder/build_lm_request_processor.pyi,sha256=33Gi3onftl-V2e_mkJios5zmXRKSoAVPX3UK7YBExjk,4491
 gllm_inference/builder/build_output_parser.pyi,sha256=_Lrq-bh1oPsb_Nwkkr_zyEUwIOMysRFZkvEtEM29LZM,936
 gllm_inference/catalog/__init__.pyi,sha256=JBkPGTyiiZ30GECzJBW-mW8LekWyY2qyzal3eW7ynaM,287
 gllm_inference/catalog/catalog.pyi,sha256=a4RNG1lKv51GxQpOqh47tz-PAROMPaeP2o5XNLBSZaU,4790
-gllm_inference/catalog/lm_request_processor_catalog.pyi,sha256=wjzufPEqey-byBU3hPWwEawT9c182WwjzSWOJ2bnqIs,4599
-gllm_inference/catalog/prompt_builder_catalog.pyi,sha256=o4JSzISjlStBataofZ2MB2_t3wnGTkkFJ3Dm_NSm5qo,3159
-gllm_inference/constants.pyi,sha256=A16iMdS6QLnDx7ToiVuu1rSxvEwcr0OMrghPUGQL0L4,220
+gllm_inference/catalog/lm_request_processor_catalog.pyi,sha256=ranHMbG9--DZj9FJRhIUa6U8e-L-Tm-_hSBpzJ6DDs4,5428
+gllm_inference/catalog/prompt_builder_catalog.pyi,sha256=OU8k_4HbqjZEzHZlzSM3uzGQZJmM2uGD76Csqom0CEQ,3197
+gllm_inference/constants.pyi,sha256=gPlwRHKIjUdyQoLdoog8ca76YmjrQL0SCDTEn8UEWSY,256
 gllm_inference/em_invoker/__init__.pyi,sha256=XESsrYo1PZeeHe7AMRyuzKoV7XDD5oN89ZTH01zRf4k,873
-gllm_inference/em_invoker/azure_openai_em_invoker.pyi,sha256=1HgCMcw7Hqv2ah4v9ma1Ioa-PpI-v2g7MfuKxxk2ZPU,4473
+gllm_inference/em_invoker/azure_openai_em_invoker.pyi,sha256=OEkVu5nv92ITqdhDtgDg4MiLSDRWDmLSnAhYtXpCn6E,4602
 gllm_inference/em_invoker/em_invoker.pyi,sha256=hiH8FB5R-KxhI8Ds2htF3cjRcIcH92yHPcOdpgc4FDo,4341
-gllm_inference/em_invoker/google_em_invoker.pyi,sha256=LQDUdsnOrB6ihBh0VdoOZHzFrY5dE3wWgBsl_slr1SI,6067
+gllm_inference/em_invoker/google_em_invoker.pyi,sha256=pn05VdOZXZOffeg89wlAQOBAyHyt6dLaS0Sd6LoH05M,6130
 gllm_inference/em_invoker/langchain/__init__.pyi,sha256=VYGKE5OgU0my1RlhgzkU_A7-GLGnUDDnNFuctuRwILE,148
 gllm_inference/em_invoker/langchain/em_invoker_embeddings.pyi,sha256=6nASLqi0FXCpqyYPl7kM3g7hAW-xS5ZwsS3GFudns98,2347
-gllm_inference/em_invoker/langchain_em_invoker.pyi,sha256=HSusS_ef5VZ20HPBFe153olueYOGQ57hmKY4406LUcE,2577
-gllm_inference/em_invoker/openai_compatible_em_invoker.pyi,sha256=GkoL-Z_Rl5v_NwcbvhUE6quLr6F9KnUB6Sb9Q712hNM,4802
-gllm_inference/em_invoker/openai_em_invoker.pyi,sha256=Gdyh93f8Mi3JYqnV1sBnYk1LAZpcsP47JeLjWxqyins,4070
+gllm_inference/em_invoker/langchain_em_invoker.pyi,sha256=lXiTTGcNOIwurZx3_6vWLE1DQyioK8Z1fOcPuUATnxA,2782
+gllm_inference/em_invoker/openai_compatible_em_invoker.pyi,sha256=Qz2Qx1KRKhzXr8IseDWcF_6yC-SNtfsXvQuGuKnqVe8,4978
+gllm_inference/em_invoker/openai_em_invoker.pyi,sha256=SFuS2DsvMHcibxFnpQOOchlZUyNRRlI2uMhVEUfifas,4235
 gllm_inference/em_invoker/schema/__init__.pyi,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-gllm_inference/em_invoker/schema/twelvelabs.pyi,sha256=y9nfqvuzs0o1jlZ5bwNmJkMSmvHAwBElWNMU0wJNc64,334
-gllm_inference/em_invoker/schema/voyage.pyi,sha256=7d9hv8uCJ4NboRaqK77g5ekb0X78pPW__sz2EYeKJKw,219
-gllm_inference/em_invoker/twelevelabs_em_invoker.pyi,sha256=9QctCbM6c9q5eHKIYEwVlhDmzcCysQupiT-4e8hllPE,4964
-gllm_inference/em_invoker/voyage_em_invoker.pyi,sha256=17NBfuii3FyBbNtNRT2y6FUMTMsDemanXnY1j_0dmZg,5032
+gllm_inference/em_invoker/schema/google.pyi,sha256=MUmgtjMmjSpzmzaAOx6JGZbcdRxgMUhOpvcVQIo-oGs,146
+gllm_inference/em_invoker/schema/langchain.pyi,sha256=onpZutqa2xw2g8rdJTdycy3ub58lkPBVB3KvVVPpyds,92
+gllm_inference/em_invoker/schema/openai.pyi,sha256=Q_dsEcodkOXYXPdrkOkW0LnuLhfeq8tEbtZAGMz2ajA,139
+gllm_inference/em_invoker/schema/openai_compatible.pyi,sha256=gmvGtsWoOMBelke_tZjC6dKimFBW9f4Vrgv0Ig0OM9Q,150
+gllm_inference/em_invoker/schema/twelvelabs.pyi,sha256=F6wKHgG01bYskJpKoheBSpRpHUfFpteKn9sj9n5YfcU,372
+gllm_inference/em_invoker/schema/voyage.pyi,sha256=HVpor0fqNy-IwapCICfsgFmqf1FJXCOMIxS2vOXhHd8,289
+gllm_inference/em_invoker/twelevelabs_em_invoker.pyi,sha256=6b8oJ8aLNBn45o85dka-Xbq9nWZqtcMgFls39ekEZ6o,5066
+gllm_inference/em_invoker/voyage_em_invoker.pyi,sha256=7akaf8GxOA8Trokad0xmlYKr49rY3Egm3_4gpW-vly8,5134
 gllm_inference/exceptions/__init__.pyi,sha256=v9uxjW5DssIn7n_bKqT7L83CeqFET2Z45GFOvi78UuE,977
 gllm_inference/exceptions/error_parser.pyi,sha256=4RkVfS2Fl9kjz_h2bK9eoAeI-Y-VkHcUqXWj68BsYig,2393
 gllm_inference/exceptions/exceptions.pyi,sha256=5YRackwVNvyOJjOtiVszqu8q87s8ioXTa-XwaYmeiC4,4643
 gllm_inference/lm_invoker/__init__.pyi,sha256=8oUFgavpItvjRUqsLqLSHqQVIPyTKCgNQ_euf58H2zY,1104
-gllm_inference/lm_invoker/anthropic_lm_invoker.pyi,sha256=Ihq8U4w_efN74gf-nDFUY_zXO4Hf4KYZ2YhWcu9MqNA,14663
-gllm_inference/lm_invoker/azure_openai_lm_invoker.pyi,sha256=98ecMvAsEKEYNS1HehL3xTKT3MLdI9AfmJVOi9jeHXM,14407
+gllm_inference/lm_invoker/anthropic_lm_invoker.pyi,sha256=wdMwGusPNJ1etEOC9SQrSspCaqtU7w2yVP-gEJhUBO0,14765
+gllm_inference/lm_invoker/azure_openai_lm_invoker.pyi,sha256=cm5dXvbETJsfMWXRCpjGo5DTtDrT6vuO-ZTlljY4bWY,14536
 gllm_inference/lm_invoker/bedrock_lm_invoker.pyi,sha256=0ZeBJ_PWuFY2dOlON11VsI4BENhFJhK4md-8DwNpcyU,12300
-gllm_inference/lm_invoker/datasaur_lm_invoker.pyi,sha256=EzovSc7FXXZLoRrOuA2rFHmBAcBEohoBaUkAFk7hQig,9049
+gllm_inference/lm_invoker/datasaur_lm_invoker.pyi,sha256=m0R95-9dIaopIf5awLNmxs39qNeRHS_HJFBi51JCmK4,9115
 gllm_inference/lm_invoker/google_lm_invoker.pyi,sha256=dRK3_--UQEBEMkLItav9MeTXp5p-iM-pqzt2JnwocPU,16393
-gllm_inference/lm_invoker/langchain_lm_invoker.pyi,sha256=2p-JM7XojIi20wxKvu1n6eJWVeQz6P069M3Quoe5ViE,13018
+gllm_inference/lm_invoker/langchain_lm_invoker.pyi,sha256=jKyq1l4MyHNyi1Or4aWO0QLIX74_PttuNlSX8vPQyeA,13157
 gllm_inference/lm_invoker/litellm_lm_invoker.pyi,sha256=ad_tVyOjATiFyYF-f_1vX2Sl4BXy-fDXEW_D8fD1Db8,13037
 gllm_inference/lm_invoker/lm_invoker.pyi,sha256=XvcR2AAH_vnIdZ3cgDer59ZT724mW22_OSF8mpeo_kk,7610
-gllm_inference/lm_invoker/openai_compatible_lm_invoker.pyi,sha256=gHYFz7S8kTq1qkh-kqXOxkBAydUWxXJyoyNkL90Kvig,14759
-gllm_inference/lm_invoker/openai_lm_invoker.pyi,sha256=EsWW-XPmpmQ_27jFezJgT5lbpQf1Hj4O6MCvN63M3v0,19325
+gllm_inference/lm_invoker/openai_compatible_lm_invoker.pyi,sha256=-_9HW5ZpUUIAOTwdG1RAoWWRF712SPLhG1nbsQ_mShg,14861
+gllm_inference/lm_invoker/openai_lm_invoker.pyi,sha256=AugnEKSOtnupKDymAGrTihz14KhOxPigHmS143M4AuE,19427
 gllm_inference/lm_invoker/schema/__init__.pyi,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-gllm_inference/lm_invoker/schema/anthropic.pyi,sha256=Y7NAjB7H0Wmiwv3YGZuG83K1rOCjSDB6hoZ6LjndWss,971
+gllm_inference/lm_invoker/schema/anthropic.pyi,sha256=aftRPzTw-f2Qi32KABXEz0b8Lzza7EvDjQfiwJco1VE,1009
 gllm_inference/lm_invoker/schema/bedrock.pyi,sha256=FOUMZkBi6KRa__mYoy3FNJ5sP0EC6rgLuhoijnwelIg,927
-gllm_inference/lm_invoker/schema/datasaur.pyi,sha256=zi1aC2SHm4U54PPLuWIbFxdvTDuguhd4CGMOwziu0Ss,192
-gllm_inference/lm_invoker/schema/google.pyi,sha256=ZwEAo30lif7v1EgpwmKng6rzCPxPyUypyKBYkvLjJJE,443
-gllm_inference/lm_invoker/schema/langchain.pyi,sha256=-0JIiMFofXoHDoMtpaFUOysvrPGJBvjDFcNeomnWTSY,371
+gllm_inference/lm_invoker/schema/datasaur.pyi,sha256=aA4DhTXIezwLvFzphR24a5ueVln2FCBIloP9Hbt3iz4,230
+gllm_inference/lm_invoker/schema/google.pyi,sha256=AIsNgq0ZZuicHmx4bL7z6q-946T05nWts3HUeA8hhHQ,505
+gllm_inference/lm_invoker/schema/langchain.pyi,sha256=l2kHU7S3vmG3-NCt8B26krp_i4Br3waES_CekkgrKSA,409
 gllm_inference/lm_invoker/schema/openai.pyi,sha256=YogOvOZqPuWkNyfcvyzaxi-Bu7UMfcoRzk4gWtkPG08,1899
-gllm_inference/lm_invoker/schema/openai_compatible.pyi,sha256=iNaiEjYe_uQnhLdkp0XMhw-D1BCZR2qQZAwgMAM49us,1022
+gllm_inference/lm_invoker/schema/openai_compatible.pyi,sha256=LlZsjxGf5idMQ1G1gLF-AClpch7ACPVvTA6Snq8pf1M,1060
 gllm_inference/model/__init__.pyi,sha256=qClHIgljqhPPCKlGTKmHsWgYb4_hADybxtC2q1U8a5Q,593
 gllm_inference/model/em/__init__.pyi,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 gllm_inference/model/em/google_em.pyi,sha256=ZPN5LmReO0bcTfnZixFooUTzgD-daNFPzfxzZ-5WzQQ,471
@@ -86,8 +90,8 @@ gllm_inference/utils/__init__.pyi,sha256=npmBmmlBv7cPHMg1hdL3S2_RelD6vk_LhCsGELh
 gllm_inference/utils/langchain.pyi,sha256=VluQiHkGigDdqLUbhB6vnXiISCP5hHqV0qokYY6dC1A,1164
 gllm_inference/utils/validation.pyi,sha256=toxBtRp-VItC_X7sNi-GDd7sjibBdWMrR0q01OI2D7k,385
 gllm_inference.build/.gitignore,sha256=aEiIwOuxfzdCmLZe4oB1JsBmCUxwG8x-u-HBCV9JT8E,1
-gllm_inference.cpython-313-x86_64-linux-gnu.so,sha256=78tK6WVfJB74YyNsPx2RKbXvggLn6hnekiYnM8LpYFY,3899848
-gllm_inference.pyi,sha256=xOoh8lTQxXc6A4XYKBobWn8RJNszAlinAmbHPJyqi30,3315
-gllm_inference_binary-0.5.5.dist-info/METADATA,sha256=S9vLvAj1-yAb0qsT4OWsW2J6gHgJxgoIejXF_lRnoEU,4531
-gllm_inference_binary-0.5.5.dist-info/WHEEL,sha256=qGYSeeDMRvGsNMRKS15OK05VQRV6Z0DMQkqDjYiypg0,110
-gllm_inference_binary-0.5.5.dist-info/RECORD,,
+gllm_inference.cpython-313-x86_64-linux-gnu.so,sha256=RR-BNblfeJ7ln9jpcIGIcKx9tgSw87zIrO4_KNnUB5A,3957416
+gllm_inference.pyi,sha256=nZrexPebvXto11VCMpLhlbjUnuV_e4qk96992EjXDDM,3315
+gllm_inference_binary-0.5.7.dist-info/METADATA,sha256=5l9vCcKon7_P35hWo6n7VhczO9x6rBULOCosHG3l4sY,4531
+gllm_inference_binary-0.5.7.dist-info/WHEEL,sha256=qGYSeeDMRvGsNMRKS15OK05VQRV6Z0DMQkqDjYiypg0,110
+gllm_inference_binary-0.5.7.dist-info/RECORD,,

{gllm_inference_binary-0.5.5.dist-info → gllm_inference_binary-0.5.7.dist-info}/WHEEL RENAMED Viewed

File without changes