model-library 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl

This diff shows the content of publicly released package versions as they appear in their respective public registries. It is provided for informational purposes only.
Files changed (48)
  1. model_library/base/base.py +237 -62
  2. model_library/base/delegate_only.py +86 -9
  3. model_library/base/input.py +10 -7
  4. model_library/base/output.py +48 -0
  5. model_library/base/utils.py +56 -7
  6. model_library/config/alibaba_models.yaml +44 -57
  7. model_library/config/all_models.json +253 -126
  8. model_library/config/kimi_models.yaml +30 -3
  9. model_library/config/openai_models.yaml +15 -23
  10. model_library/config/zai_models.yaml +24 -3
  11. model_library/exceptions.py +14 -77
  12. model_library/logging.py +6 -2
  13. model_library/providers/ai21labs.py +30 -14
  14. model_library/providers/alibaba.py +17 -8
  15. model_library/providers/amazon.py +119 -64
  16. model_library/providers/anthropic.py +184 -104
  17. model_library/providers/azure.py +22 -10
  18. model_library/providers/cohere.py +7 -7
  19. model_library/providers/deepseek.py +8 -8
  20. model_library/providers/fireworks.py +7 -8
  21. model_library/providers/google/batch.py +17 -13
  22. model_library/providers/google/google.py +130 -73
  23. model_library/providers/inception.py +7 -7
  24. model_library/providers/kimi.py +18 -8
  25. model_library/providers/minimax.py +30 -13
  26. model_library/providers/mistral.py +61 -35
  27. model_library/providers/openai.py +219 -93
  28. model_library/providers/openrouter.py +34 -0
  29. model_library/providers/perplexity.py +7 -7
  30. model_library/providers/together.py +7 -8
  31. model_library/providers/vals.py +16 -9
  32. model_library/providers/xai.py +157 -144
  33. model_library/providers/zai.py +38 -8
  34. model_library/register_models.py +4 -2
  35. model_library/registry_utils.py +39 -15
  36. model_library/retriers/__init__.py +0 -0
  37. model_library/retriers/backoff.py +73 -0 (new; see the backoff sketch after this list)
  38. model_library/retriers/base.py +225 -0
  39. model_library/retriers/token.py +427 -0
  40. model_library/retriers/utils.py +11 -0
  41. model_library/settings.py +1 -1
  42. model_library/utils.py +13 -35
  43. {model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/METADATA +4 -3
  44. model_library-0.1.8.dist-info/RECORD +70 -0
  45. {model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/WHEEL +1 -1
  46. model_library-0.1.6.dist-info/RECORD +0 -64
  47. {model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/licenses/LICENSE +0 -0
  48. {model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/top_level.txt +0 -0
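Items 36-40 add a new model_library/retriers package (a base retrier plus backoff- and token-based implementations). Its contents are not shown in the hunks below, which all come from model_library/providers/mistral.py. For orientation only, capped exponential backoff with jitter, the pattern such a module typically implements, looks roughly like the following sketch; the name, signature, and behavior here are illustrative, not the package's actual API:

import asyncio
import random

async def retry_with_backoff(fn, max_attempts=5, base_delay=1.0, max_delay=30.0):
    # Illustrative only: the real retriers/backoff.py is not shown in this
    # diff and its API almost certainly differs.
    for attempt in range(max_attempts):
        try:
            return await fn()  # fn is a zero-arg async callable
        except Exception:
            if attempt == max_attempts - 1:
                raise
            # capped exponential backoff with full jitter
            delay = min(max_delay, base_delay * 2**attempt)
            await asyncio.sleep(random.uniform(0, delay))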
model_library/providers/mistral.py
@@ -1,10 +1,15 @@
 import io
 import logging
-import time
 from collections.abc import Sequence
 from typing import Any, Literal
 
-from mistralai import AssistantMessage, ContentChunk, Mistral, TextChunk, ThinkChunk
+from mistralai import (
+    AssistantMessage,
+    ContentChunk,
+    Mistral,
+    TextChunk,
+    ThinkChunk,
+)
 from mistralai.models.completionevent import CompletionEvent
 from mistralai.models.toolcall import ToolCall as MistralToolCall
 from mistralai.utils.eventstreaming import EventStreamAsync
@@ -13,14 +18,16 @@ from typing_extensions import override
 from model_library import model_library_settings
 from model_library.base import (
     LLM,
+    FileBase,
     FileInput,
     FileWithBase64,
     FileWithId,
-    FileWithUrl,
     InputItem,
     LLMConfig,
     QueryResult,
     QueryResultMetadata,
+    RawInput,
+    RawResponse,
     TextInput,
     ToolBody,
     ToolCall,
@@ -39,16 +46,20 @@ from model_library.utils import default_httpx_client
 
 @register_provider("mistralai")
 class MistralModel(LLM):
-    _client: Mistral | None = None
+    @override
+    def _get_default_api_key(self) -> str:
+        return model_library_settings.MISTRAL_API_KEY
 
     @override
-    def get_client(self) -> Mistral:
-        if not MistralModel._client:
-            MistralModel._client = Mistral(
-                api_key=model_library_settings.MISTRAL_API_KEY,
+    def get_client(self, api_key: str | None = None) -> Mistral:
+        if not self.has_client():
+            assert api_key
+            client = Mistral(
+                api_key=api_key,
                 async_client=default_httpx_client(),
             )
-        return MistralModel._client
+            self.assign_client(client)
+        return super().get_client()
 
     def __init__(
         self,
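The client is no longer cached on the class, where one shared instance was built from the global MISTRAL_API_KEY; it now lives on each instance behind has_client()/assign_client()/super().get_client(), with the key resolved per instance via _get_default_api_key(). A minimal sketch of that base-class contract, inferred from this hunk alone (the real LLM base class in model_library/base is not shown here and may differ):

from typing import Any

class ClientCacheMixin:
    # Inferred sketch of the contract behind the new get_client().
    _client: Any = None

    def has_client(self) -> bool:
        return self._client is not None

    def assign_client(self, client: Any) -> None:
        self._client = client  # stored per instance, not on the class

    def get_client(self, api_key: str | None = None) -> Any:
        assert self._client is not None, "assign_client() must be called first"
        return self._client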
@@ -69,27 +80,30 @@ class MistralModel(LLM):
         content_user: list[dict[str, Any]] = []
 
         def flush_content_user():
-            nonlocal content_user
-
             if content_user:
-                new_input.append({"role": "user", "content": content_user})
-                content_user = []
+                # NOTE: must make new object as we clear()
+                new_input.append({"role": "user", "content": content_user.copy()})
+                content_user.clear()
 
         for item in input:
+            if isinstance(item, TextInput):
+                content_user.append({"type": "text", "text": item.text})
+                continue
+
+            if isinstance(item, FileBase):
+                match item.type:
+                    case "image":
+                        parsed = await self.parse_image(item)
+                    case "file":
+                        parsed = await self.parse_file(item)
+                content_user.append(parsed)
+                continue
+
+            # non content user item
+            flush_content_user()
+
             match item:
-                case TextInput():
-                    content_user.append({"type": "text", "text": item.text})
-                case FileWithBase64() | FileWithUrl() | FileWithId():
-                    match item.type:
-                        case "image":
-                            content_user.append(await self.parse_image(item))
-                        case "file":
-                            content_user.append(await self.parse_file(item))
-                case AssistantMessage():
-                    flush_content_user()
-                    new_input.append(item)
                 case ToolResult():
-                    flush_content_user()
                     new_input.append(
                         {
                             "role": "tool",
@@ -98,9 +112,12 @@ class MistralModel(LLM):
                             "tool_call_id": item.tool_call.id,
                         }
                     )
-                case _:
-                    raise BadInputError("Unsupported input type")
+                case RawResponse():
+                    new_input.append(item.response)
+                case RawInput():
+                    new_input.append(item.input)
 
+        # in case content user item is the last item
        flush_content_user()
 
        return new_input
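The NOTE in the hunk above is load-bearing: flush_content_user() now mutates content_user in place instead of rebinding it (which is why the nonlocal could be dropped), so the appended message must receive a copy before clear() empties the buffer. A standalone demonstration of the aliasing bug the .copy() avoids:

content: list[dict[str, str]] = [{"type": "text", "text": "hi"}]
messages: list[dict[str, object]] = []

# Without the copy, the message aliases the buffer and clear() guts it:
messages.append({"role": "user", "content": content})
content.clear()
assert messages[0]["content"] == []

# With .copy(), the message keeps a snapshot of the buffer:
content.append({"type": "text", "text": "hi"})
messages.append({"role": "user", "content": content.copy()})
content.clear()
assert messages[1]["content"] == [{"type": "text", "text": "hi"}]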
@@ -167,14 +184,13 @@ class MistralModel(LLM):
         raise NotImplementedError()
 
     @override
-    async def _query_impl(
+    async def build_body(
         self,
         input: Sequence[InputItem],
         *,
         tools: list[ToolDefinition],
-        query_logger: logging.Logger,
         **kwargs: object,
-    ) -> QueryResult:
+    ) -> dict[str, Any]:
         # mistral supports max 8 images, merge extra images into the 8th image
         input = trim_images(input, max_images=8)
 
@@ -192,12 +208,14 @@
 
         body: dict[str, Any] = {
             "model": self.model_name,
-            "max_tokens": self.max_tokens,
             "messages": messages,
             "prompt_mode": "reasoning" if self.reasoning else None,
             "tools": tools,
         }
 
+        if self.max_tokens:
+            body["max_tokens"] = self.max_tokens
+
         if self.supports_temperature:
             if self.temperature is not None:
                 body["temperature"] = self.temperature
@@ -205,8 +223,18 @@ class MistralModel(LLM):
                 body["top_p"] = self.top_p
 
         body.update(kwargs)
+        return body
 
-        start = time.time()
+    @override
+    async def _query_impl(
+        self,
+        input: Sequence[InputItem],
+        *,
+        tools: list[ToolDefinition],
+        query_logger: logging.Logger,
+        **kwargs: object,
+    ) -> QueryResult:
+        body = await self.build_body(input, tools=tools, **kwargs)
 
         response: EventStreamAsync[
             CompletionEvent
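With body construction factored out of _query_impl(), the request payload can be adjusted or inspected without touching the streaming loop. A hypothetical subclass enabled by the split (the import path for MistralModel and the exact override shape are assumptions based on the hunks above):

from collections.abc import Sequence
from typing import Any

from typing_extensions import override

class PatchedMistralModel(MistralModel):
    @override
    async def build_body(
        self,
        input: Sequence[InputItem],
        *,
        tools: list[ToolDefinition],
        **kwargs: object,
    ) -> dict[str, Any]:
        body = await super().build_body(input, tools=tools, **kwargs)
        body["prompt_mode"] = None  # e.g. force non-reasoning mode for this run
        return body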
@@ -247,8 +275,6 @@ class MistralModel(LLM):
                     in_tokens += data.usage.prompt_tokens or 0
                     out_tokens += data.usage.completion_tokens or 0
 
-            self.logger.info(f"Finished in: {time.time() - start}")
-
         except Exception as e:
             self.logger.error(f"Error: {e}", exc_info=True)
             raise e
@@ -302,7 +328,7 @@ class MistralModel(LLM):
         return QueryResult(
             output_text=text,
             reasoning=reasoning or None,
-            history=[*input, message],
+            history=[*input, RawResponse(response=message)],
             tool_calls=tool_calls,
             metadata=QueryResultMetadata(
                 in_tokens=in_tokens,
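The history now carries the provider-native assistant message wrapped in RawResponse rather than a bare AssistantMessage; on the next turn, the input-conversion loop above unwraps it via case RawResponse(): new_input.append(item.response). A plausible shape for the wrappers, inferred only from how the hunks consume them (the real definitions live in model_library/base and may differ):

from dataclasses import dataclass
from typing import Any

@dataclass
class RawResponse:
    response: Any  # provider-native assistant message, e.g. AssistantMessage

@dataclass
class RawInput:
    input: Any  # provider-native request message, appended verbatim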