mistralai 1.5.2__py3-none-any.whl → 1.6.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mistralai/_hooks/types.py +15 -3
- mistralai/_version.py +3 -3
- mistralai/agents.py +44 -12
- mistralai/basesdk.py +8 -0
- mistralai/chat.py +44 -12
- mistralai/classifiers.py +36 -16
- mistralai/embeddings.py +16 -6
- mistralai/files.py +36 -0
- mistralai/fim.py +32 -12
- mistralai/httpclient.py +4 -2
- mistralai/jobs.py +30 -0
- mistralai/mistral_jobs.py +24 -0
- mistralai/models/agentscompletionrequest.py +4 -0
- mistralai/models/agentscompletionstreamrequest.py +4 -0
- mistralai/models/chatcompletionrequest.py +4 -0
- mistralai/models/chatcompletionstreamrequest.py +4 -0
- mistralai/models/function.py +2 -2
- mistralai/models/jsonschema.py +1 -1
- mistralai/models_.py +66 -18
- mistralai/ocr.py +16 -6
- mistralai/sdk.py +19 -3
- mistralai/sdkconfiguration.py +4 -2
- mistralai/utils/__init__.py +2 -0
- mistralai/utils/serializers.py +10 -6
- mistralai/utils/values.py +4 -1
- {mistralai-1.5.2.dist-info → mistralai-1.6.0.dist-info}/METADATA +63 -16
- {mistralai-1.5.2.dist-info → mistralai-1.6.0.dist-info}/RECORD +80 -72
- mistralai_azure/__init__.py +10 -1
- mistralai_azure/_hooks/types.py +15 -3
- mistralai_azure/_version.py +4 -1
- mistralai_azure/basesdk.py +8 -0
- mistralai_azure/chat.py +100 -20
- mistralai_azure/httpclient.py +52 -0
- mistralai_azure/models/__init__.py +22 -0
- mistralai_azure/models/assistantmessage.py +2 -0
- mistralai_azure/models/chatcompletionrequest.py +12 -10
- mistralai_azure/models/chatcompletionstreamrequest.py +12 -10
- mistralai_azure/models/contentchunk.py +6 -2
- mistralai_azure/models/function.py +4 -1
- mistralai_azure/models/imageurl.py +53 -0
- mistralai_azure/models/imageurlchunk.py +33 -0
- mistralai_azure/models/jsonschema.py +61 -0
- mistralai_azure/models/prediction.py +25 -0
- mistralai_azure/models/responseformat.py +42 -1
- mistralai_azure/models/responseformats.py +1 -1
- mistralai_azure/models/toolcall.py +3 -0
- mistralai_azure/sdk.py +56 -14
- mistralai_azure/sdkconfiguration.py +14 -6
- mistralai_azure/utils/__init__.py +2 -0
- mistralai_azure/utils/serializers.py +10 -6
- mistralai_azure/utils/values.py +4 -1
- mistralai_gcp/__init__.py +10 -1
- mistralai_gcp/_hooks/types.py +15 -3
- mistralai_gcp/_version.py +4 -1
- mistralai_gcp/basesdk.py +8 -0
- mistralai_gcp/chat.py +101 -21
- mistralai_gcp/fim.py +61 -21
- mistralai_gcp/httpclient.py +52 -0
- mistralai_gcp/models/__init__.py +22 -0
- mistralai_gcp/models/assistantmessage.py +2 -0
- mistralai_gcp/models/chatcompletionrequest.py +12 -10
- mistralai_gcp/models/chatcompletionstreamrequest.py +12 -10
- mistralai_gcp/models/contentchunk.py +6 -2
- mistralai_gcp/models/fimcompletionrequest.py +2 -3
- mistralai_gcp/models/fimcompletionstreamrequest.py +2 -3
- mistralai_gcp/models/function.py +4 -1
- mistralai_gcp/models/imageurl.py +53 -0
- mistralai_gcp/models/imageurlchunk.py +33 -0
- mistralai_gcp/models/jsonschema.py +61 -0
- mistralai_gcp/models/prediction.py +25 -0
- mistralai_gcp/models/responseformat.py +42 -1
- mistralai_gcp/models/responseformats.py +1 -1
- mistralai_gcp/models/toolcall.py +3 -0
- mistralai_gcp/sdk.py +63 -19
- mistralai_gcp/sdkconfiguration.py +14 -6
- mistralai_gcp/utils/__init__.py +2 -0
- mistralai_gcp/utils/serializers.py +10 -6
- mistralai_gcp/utils/values.py +4 -1
- {mistralai-1.5.2.dist-info → mistralai-1.6.0.dist-info}/LICENSE +0 -0
- {mistralai-1.5.2.dist-info → mistralai-1.6.0.dist-info}/WHEEL +0 -0
mistralai_azure/basesdk.py
CHANGED
@@ -231,6 +231,10 @@ class BaseSDK:
                 req.headers,
                 get_body_content(req),
             )
+
+            if client is None:
+                raise ValueError("client is required")
+
             http_res = client.send(req, stream=stream)
         except Exception as e:
             _, e = self.sdk_configuration.get_hooks().after_error(
@@ -303,6 +307,10 @@ class BaseSDK:
                 req.headers,
                 get_body_content(req),
             )
+
+            if client is None:
+                raise ValueError("client is required")
+
             http_res = await client.send(req, stream=stream)
         except Exception as e:
             _, e = self.sdk_configuration.get_hooks().after_error(
mistralai_azure/chat.py
CHANGED
@@ -15,7 +15,7 @@ class Chat(BaseSDK):
         self,
         *,
         messages: Union[List[models.Messages], List[models.MessagesTypedDict]],
-        model:
+        model: Optional[str] = "azureai",
         temperature: OptionalNullable[float] = UNSET,
         top_p: Optional[float] = None,
         max_tokens: OptionalNullable[int] = UNSET,
@@ -37,6 +37,10 @@ class Chat(BaseSDK):
         presence_penalty: Optional[float] = None,
         frequency_penalty: Optional[float] = None,
         n: OptionalNullable[int] = UNSET,
+        prediction: Optional[
+            Union[models.Prediction, models.PredictionTypedDict]
+        ] = None,
+        parallel_tool_calls: Optional[bool] = None,
         safe_prompt: Optional[bool] = None,
         retries: OptionalNullable[utils.RetryConfig] = UNSET,
         server_url: Optional[str] = None,
@@ -61,6 +65,8 @@ class Chat(BaseSDK):
         :param presence_penalty: presence_penalty determines how much the model penalizes the repetition of words or phrases. A higher presence penalty encourages the model to use a wider variety of words and phrases, making the output more diverse and creative.
         :param frequency_penalty: frequency_penalty penalizes the repetition of words based on their frequency in the generated text. A higher frequency penalty discourages the model from repeating words that have already appeared frequently in the output, promoting diversity and reducing repetition.
         :param n: Number of completions to return for each request, input tokens are only billed once.
+        :param prediction:
+        :param parallel_tool_calls:
         :param safe_prompt: Whether to inject a safety prompt before all conversations.
         :param retries: Override the default retry configuration for this method
         :param server_url: Override the default server URL for this method
@@ -74,6 +80,8 @@ class Chat(BaseSDK):
 
         if server_url is not None:
             base_url = server_url
+        else:
+            base_url = self._get_url(base_url, url_variables)
 
         request = models.ChatCompletionStreamRequest(
             model=model,
@@ -94,6 +102,10 @@ class Chat(BaseSDK):
             presence_penalty=presence_penalty,
             frequency_penalty=frequency_penalty,
             n=n,
+            prediction=utils.get_pydantic_model(
+                prediction, Optional[models.Prediction]
+            ),
+            parallel_tool_calls=parallel_tool_calls,
             safe_prompt=safe_prompt,
         )
 
@@ -126,6 +138,7 @@ class Chat(BaseSDK):
 
         http_res = self.do_request(
             hook_ctx=HookContext(
+                base_url=base_url or "",
                 operation_id="stream_chat",
                 oauth2_scopes=[],
                 security_source=self.sdk_configuration.security,
@@ -136,7 +149,7 @@ class Chat(BaseSDK):
             retry_config=retry_config,
         )
 
-
+        response_data: Any = None
         if utils.match_response(http_res, "200", "text/event-stream"):
             return eventstreaming.EventStream(
                 http_res,
@@ -145,9 +158,16 @@ class Chat(BaseSDK):
             )
         if utils.match_response(http_res, "422", "application/json"):
             http_res_text = utils.stream_to_text(http_res)
-
-
-
+            response_data = utils.unmarshal_json(
+                http_res_text, models.HTTPValidationErrorData
+            )
+            raise models.HTTPValidationError(data=response_data)
+        if utils.match_response(http_res, "4XX", "*"):
+            http_res_text = utils.stream_to_text(http_res)
+            raise models.SDKError(
+                "API error occurred", http_res.status_code, http_res_text, http_res
+            )
+        if utils.match_response(http_res, "5XX", "*"):
             http_res_text = utils.stream_to_text(http_res)
             raise models.SDKError(
                 "API error occurred", http_res.status_code, http_res_text, http_res
@@ -166,7 +186,7 @@ class Chat(BaseSDK):
         self,
         *,
         messages: Union[List[models.Messages], List[models.MessagesTypedDict]],
-        model:
+        model: Optional[str] = "azureai",
         temperature: OptionalNullable[float] = UNSET,
         top_p: Optional[float] = None,
         max_tokens: OptionalNullable[int] = UNSET,
@@ -188,6 +208,10 @@ class Chat(BaseSDK):
         presence_penalty: Optional[float] = None,
         frequency_penalty: Optional[float] = None,
         n: OptionalNullable[int] = UNSET,
+        prediction: Optional[
+            Union[models.Prediction, models.PredictionTypedDict]
+        ] = None,
+        parallel_tool_calls: Optional[bool] = None,
         safe_prompt: Optional[bool] = None,
         retries: OptionalNullable[utils.RetryConfig] = UNSET,
         server_url: Optional[str] = None,
@@ -212,6 +236,8 @@ class Chat(BaseSDK):
         :param presence_penalty: presence_penalty determines how much the model penalizes the repetition of words or phrases. A higher presence penalty encourages the model to use a wider variety of words and phrases, making the output more diverse and creative.
         :param frequency_penalty: frequency_penalty penalizes the repetition of words based on their frequency in the generated text. A higher frequency penalty discourages the model from repeating words that have already appeared frequently in the output, promoting diversity and reducing repetition.
         :param n: Number of completions to return for each request, input tokens are only billed once.
+        :param prediction:
+        :param parallel_tool_calls:
         :param safe_prompt: Whether to inject a safety prompt before all conversations.
         :param retries: Override the default retry configuration for this method
         :param server_url: Override the default server URL for this method
@@ -225,6 +251,8 @@ class Chat(BaseSDK):
 
         if server_url is not None:
             base_url = server_url
+        else:
+            base_url = self._get_url(base_url, url_variables)
 
         request = models.ChatCompletionStreamRequest(
             model=model,
@@ -245,6 +273,10 @@ class Chat(BaseSDK):
             presence_penalty=presence_penalty,
             frequency_penalty=frequency_penalty,
             n=n,
+            prediction=utils.get_pydantic_model(
+                prediction, Optional[models.Prediction]
+            ),
+            parallel_tool_calls=parallel_tool_calls,
             safe_prompt=safe_prompt,
         )
 
@@ -277,6 +309,7 @@ class Chat(BaseSDK):
 
         http_res = await self.do_request_async(
             hook_ctx=HookContext(
+                base_url=base_url or "",
                 operation_id="stream_chat",
                 oauth2_scopes=[],
                 security_source=self.sdk_configuration.security,
@@ -287,7 +320,7 @@ class Chat(BaseSDK):
             retry_config=retry_config,
         )
 
-
+        response_data: Any = None
         if utils.match_response(http_res, "200", "text/event-stream"):
             return eventstreaming.EventStreamAsync(
                 http_res,
@@ -296,9 +329,16 @@ class Chat(BaseSDK):
             )
         if utils.match_response(http_res, "422", "application/json"):
             http_res_text = await utils.stream_to_text_async(http_res)
-
-
-
+            response_data = utils.unmarshal_json(
+                http_res_text, models.HTTPValidationErrorData
+            )
+            raise models.HTTPValidationError(data=response_data)
+        if utils.match_response(http_res, "4XX", "*"):
+            http_res_text = await utils.stream_to_text_async(http_res)
+            raise models.SDKError(
+                "API error occurred", http_res.status_code, http_res_text, http_res
+            )
+        if utils.match_response(http_res, "5XX", "*"):
             http_res_text = await utils.stream_to_text_async(http_res)
             raise models.SDKError(
                 "API error occurred", http_res.status_code, http_res_text, http_res
@@ -320,7 +360,7 @@ class Chat(BaseSDK):
             List[models.ChatCompletionRequestMessages],
             List[models.ChatCompletionRequestMessagesTypedDict],
         ],
-        model:
+        model: Optional[str] = "azureai",
         temperature: OptionalNullable[float] = UNSET,
         top_p: Optional[float] = None,
         max_tokens: OptionalNullable[int] = UNSET,
@@ -347,6 +387,10 @@ class Chat(BaseSDK):
         presence_penalty: Optional[float] = None,
         frequency_penalty: Optional[float] = None,
         n: OptionalNullable[int] = UNSET,
+        prediction: Optional[
+            Union[models.Prediction, models.PredictionTypedDict]
+        ] = None,
+        parallel_tool_calls: Optional[bool] = None,
         safe_prompt: Optional[bool] = None,
         retries: OptionalNullable[utils.RetryConfig] = UNSET,
         server_url: Optional[str] = None,
@@ -369,6 +413,8 @@ class Chat(BaseSDK):
         :param presence_penalty: presence_penalty determines how much the model penalizes the repetition of words or phrases. A higher presence penalty encourages the model to use a wider variety of words and phrases, making the output more diverse and creative.
         :param frequency_penalty: frequency_penalty penalizes the repetition of words based on their frequency in the generated text. A higher frequency penalty discourages the model from repeating words that have already appeared frequently in the output, promoting diversity and reducing repetition.
         :param n: Number of completions to return for each request, input tokens are only billed once.
+        :param prediction:
+        :param parallel_tool_calls:
         :param safe_prompt: Whether to inject a safety prompt before all conversations.
         :param retries: Override the default retry configuration for this method
         :param server_url: Override the default server URL for this method
@@ -382,6 +428,8 @@ class Chat(BaseSDK):
 
         if server_url is not None:
             base_url = server_url
+        else:
+            base_url = self._get_url(base_url, url_variables)
 
         request = models.ChatCompletionRequest(
             model=model,
@@ -404,6 +452,10 @@ class Chat(BaseSDK):
             presence_penalty=presence_penalty,
             frequency_penalty=frequency_penalty,
             n=n,
+            prediction=utils.get_pydantic_model(
+                prediction, Optional[models.Prediction]
+            ),
+            parallel_tool_calls=parallel_tool_calls,
             safe_prompt=safe_prompt,
         )
 
@@ -436,6 +488,7 @@ class Chat(BaseSDK):
 
         http_res = self.do_request(
             hook_ctx=HookContext(
+                base_url=base_url or "",
                 operation_id="chat_completion_v1_chat_completions_post",
                 oauth2_scopes=[],
                 security_source=self.sdk_configuration.security,
@@ -445,15 +498,22 @@ class Chat(BaseSDK):
             retry_config=retry_config,
         )
 
-
+        response_data: Any = None
         if utils.match_response(http_res, "200", "application/json"):
             return utils.unmarshal_json(
                 http_res.text, Optional[models.ChatCompletionResponse]
             )
         if utils.match_response(http_res, "422", "application/json"):
-
-
-
+            response_data = utils.unmarshal_json(
+                http_res.text, models.HTTPValidationErrorData
+            )
+            raise models.HTTPValidationError(data=response_data)
+        if utils.match_response(http_res, "4XX", "*"):
+            http_res_text = utils.stream_to_text(http_res)
+            raise models.SDKError(
+                "API error occurred", http_res.status_code, http_res_text, http_res
+            )
+        if utils.match_response(http_res, "5XX", "*"):
             http_res_text = utils.stream_to_text(http_res)
             raise models.SDKError(
                 "API error occurred", http_res.status_code, http_res_text, http_res
@@ -475,7 +535,7 @@ class Chat(BaseSDK):
             List[models.ChatCompletionRequestMessages],
             List[models.ChatCompletionRequestMessagesTypedDict],
         ],
-        model:
+        model: Optional[str] = "azureai",
         temperature: OptionalNullable[float] = UNSET,
         top_p: Optional[float] = None,
         max_tokens: OptionalNullable[int] = UNSET,
@@ -502,6 +562,10 @@ class Chat(BaseSDK):
         presence_penalty: Optional[float] = None,
         frequency_penalty: Optional[float] = None,
         n: OptionalNullable[int] = UNSET,
+        prediction: Optional[
+            Union[models.Prediction, models.PredictionTypedDict]
+        ] = None,
+        parallel_tool_calls: Optional[bool] = None,
         safe_prompt: Optional[bool] = None,
         retries: OptionalNullable[utils.RetryConfig] = UNSET,
         server_url: Optional[str] = None,
@@ -524,6 +588,8 @@ class Chat(BaseSDK):
         :param presence_penalty: presence_penalty determines how much the model penalizes the repetition of words or phrases. A higher presence penalty encourages the model to use a wider variety of words and phrases, making the output more diverse and creative.
         :param frequency_penalty: frequency_penalty penalizes the repetition of words based on their frequency in the generated text. A higher frequency penalty discourages the model from repeating words that have already appeared frequently in the output, promoting diversity and reducing repetition.
         :param n: Number of completions to return for each request, input tokens are only billed once.
+        :param prediction:
+        :param parallel_tool_calls:
         :param safe_prompt: Whether to inject a safety prompt before all conversations.
         :param retries: Override the default retry configuration for this method
         :param server_url: Override the default server URL for this method
@@ -537,6 +603,8 @@ class Chat(BaseSDK):
 
         if server_url is not None:
             base_url = server_url
+        else:
+            base_url = self._get_url(base_url, url_variables)
 
         request = models.ChatCompletionRequest(
             model=model,
@@ -559,6 +627,10 @@ class Chat(BaseSDK):
             presence_penalty=presence_penalty,
             frequency_penalty=frequency_penalty,
             n=n,
+            prediction=utils.get_pydantic_model(
+                prediction, Optional[models.Prediction]
+            ),
+            parallel_tool_calls=parallel_tool_calls,
             safe_prompt=safe_prompt,
         )
 
@@ -591,6 +663,7 @@ class Chat(BaseSDK):
 
         http_res = await self.do_request_async(
             hook_ctx=HookContext(
+                base_url=base_url or "",
                 operation_id="chat_completion_v1_chat_completions_post",
                 oauth2_scopes=[],
                 security_source=self.sdk_configuration.security,
@@ -600,15 +673,22 @@ class Chat(BaseSDK):
             retry_config=retry_config,
         )
 
-
+        response_data: Any = None
         if utils.match_response(http_res, "200", "application/json"):
             return utils.unmarshal_json(
                 http_res.text, Optional[models.ChatCompletionResponse]
            )
         if utils.match_response(http_res, "422", "application/json"):
-
-
-
+            response_data = utils.unmarshal_json(
+                http_res.text, models.HTTPValidationErrorData
+            )
+            raise models.HTTPValidationError(data=response_data)
+        if utils.match_response(http_res, "4XX", "*"):
+            http_res_text = await utils.stream_to_text_async(http_res)
+            raise models.SDKError(
+                "API error occurred", http_res.status_code, http_res_text, http_res
+            )
+        if utils.match_response(http_res, "5XX", "*"):
             http_res_text = await utils.stream_to_text_async(http_res)
             raise models.SDKError(
                 "API error occurred", http_res.status_code, http_res_text, http_res
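
Every chat entry point above now accepts prediction and parallel_tool_calls. A minimal usage sketch, assuming the MistralAzure client is constructed with azure_api_key/azure_endpoint as in the package README and that Prediction can be passed as a dict with type and content keys (both are assumptions, not part of this diff):

from mistralai_azure import MistralAzure

# Endpoint and key values are illustrative placeholders.
client = MistralAzure(
    azure_api_key="AZURE_API_KEY",
    azure_endpoint="https://example-endpoint.models.ai.azure.com",
)

res = client.chat.complete(
    messages=[{"role": "user", "content": "Refactor this helper and keep its docstring."}],
    # New in 1.6.0: predicted-output hint (dict shape assumed to mirror PredictionTypedDict).
    prediction={"type": "content", "content": "def helper():\n    ..."},
    # New in 1.6.0: allow or forbid the model to issue tool calls in parallel.
    parallel_tool_calls=False,
)
if res is not None:
    print(res.choices[0].message.content)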
mistralai_azure/httpclient.py
CHANGED
@@ -1,6 +1,8 @@
 """Code generated by Speakeasy (https://speakeasy.com). DO NOT EDIT."""
 
 # pyright: reportReturnType = false
+import asyncio
+from concurrent.futures import ThreadPoolExecutor
 from typing_extensions import Protocol, runtime_checkable
 import httpx
 from typing import Any, Optional, Union
@@ -82,3 +84,53 @@ class AsyncHttpClient(Protocol):
 
     async def aclose(self) -> None:
         pass
+
+
+class ClientOwner(Protocol):
+    client: Union[HttpClient, None]
+    async_client: Union[AsyncHttpClient, None]
+
+
+def close_clients(
+    owner: ClientOwner,
+    sync_client: Union[HttpClient, None],
+    sync_client_supplied: bool,
+    async_client: Union[AsyncHttpClient, None],
+    async_client_supplied: bool,
+) -> None:
+    """
+    A finalizer function that is meant to be used with weakref.finalize to close
+    httpx clients used by an SDK so that underlying resources can be garbage
+    collected.
+    """
+
+    # Unset the client/async_client properties so there are no more references
+    # to them from the owning SDK instance and they can be reaped.
+    owner.client = None
+    owner.async_client = None
+
+    if sync_client is not None and not sync_client_supplied:
+        try:
+            sync_client.close()
+        except Exception:
+            pass
+
+    if async_client is not None and not async_client_supplied:
+        is_async = False
+        try:
+            asyncio.get_running_loop()
+            is_async = True
+        except RuntimeError:
+            pass
+
+        try:
+            # If this function is called in an async loop then start another
+            # loop in a separate thread to close the async http client.
+            if is_async:
+                with ThreadPoolExecutor(max_workers=1) as executor:
+                    future = executor.submit(asyncio.run, async_client.aclose())
+                    future.result()
+            else:
+                asyncio.run(async_client.aclose())
+        except Exception:
+            pass
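
The new close_clients helper documents itself as a weakref.finalize target. A self-contained sketch of that wiring; the Config and SDKLike classes below are illustrative stand-ins, not the SDK's actual sdk.py changes:

import weakref
import httpx
from mistralai_azure.httpclient import close_clients

class Config:
    # Minimal stand-in satisfying the ClientOwner protocol.
    client = None
    async_client = None

class SDKLike:
    def __init__(self):
        self.config = Config()
        self.config.client = httpx.Client()
        self.config.async_client = httpx.AsyncClient()
        # Register against the SDK-like object but pass the config as the owner,
        # so the finalizer itself holds no reference back to the SDK instance.
        weakref.finalize(
            self,
            close_clients,
            self.config,
            self.config.client,
            False,  # sync client was created internally, so it may be closed
            self.config.async_client,
            False,  # async client was created internally, so it may be closed
        )

sdk = SDKLike()
del sdk  # once the object is collected, the finalizer closes both httpx clients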

mistralai_azure/models/__init__.py
CHANGED

@@ -54,6 +54,16 @@ from .functioncall import (
 )
 from .functionname import FunctionName, FunctionNameTypedDict
 from .httpvalidationerror import HTTPValidationError, HTTPValidationErrorData
+from .imageurl import ImageURL, ImageURLTypedDict
+from .imageurlchunk import (
+    ImageURLChunk,
+    ImageURLChunkImageURL,
+    ImageURLChunkImageURLTypedDict,
+    ImageURLChunkType,
+    ImageURLChunkTypedDict,
+)
+from .jsonschema import JSONSchema, JSONSchemaTypedDict
+from .prediction import Prediction, PredictionTypedDict
 from .referencechunk import ReferenceChunk, ReferenceChunkType, ReferenceChunkTypedDict
 from .responseformat import ResponseFormat, ResponseFormatTypedDict
 from .responseformats import ResponseFormats
@@ -94,6 +104,7 @@ from .validationerror import (
     ValidationErrorTypedDict,
 )
 
+
 __all__ = [
     "Arguments",
     "ArgumentsTypedDict",
@@ -140,10 +151,21 @@ __all__ = [
     "FunctionTypedDict",
     "HTTPValidationError",
     "HTTPValidationErrorData",
+    "ImageURL",
+    "ImageURLChunk",
+    "ImageURLChunkImageURL",
+    "ImageURLChunkImageURLTypedDict",
+    "ImageURLChunkType",
+    "ImageURLChunkTypedDict",
+    "ImageURLTypedDict",
+    "JSONSchema",
+    "JSONSchemaTypedDict",
     "Loc",
     "LocTypedDict",
     "Messages",
     "MessagesTypedDict",
+    "Prediction",
+    "PredictionTypedDict",
     "ReferenceChunk",
     "ReferenceChunkType",
     "ReferenceChunkTypedDict",

mistralai_azure/models/assistantmessage.py
CHANGED

@@ -32,6 +32,7 @@ class AssistantMessageTypedDict(TypedDict):
     content: NotRequired[Nullable[AssistantMessageContentTypedDict]]
     tool_calls: NotRequired[Nullable[List[ToolCallTypedDict]]]
     prefix: NotRequired[bool]
+    r"""Set this to `true` when adding an assistant message as prefix to condition the model response. The role of the prefix message is to force the model to start its answer by the content of the message."""
     role: NotRequired[AssistantMessageRole]
 
 
@@ -41,6 +42,7 @@ class AssistantMessage(BaseModel):
     tool_calls: OptionalNullable[List[ToolCall]] = UNSET
 
     prefix: Optional[bool] = False
+    r"""Set this to `true` when adding an assistant message as prefix to condition the model response. The role of the prefix message is to force the model to start its answer by the content of the message."""
 
     role: Optional[AssistantMessageRole] = "assistant"
 
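
The docstring added above describes the prefix mechanism. A short sketch, reusing the illustrative client from the earlier example, of forcing the reply to begin with given assistant text:

# prefix=True conditions the model to start its answer with this content.
res = client.chat.complete(
    messages=[
        {"role": "user", "content": "Summarize this release in one sentence."},
        {"role": "assistant", "content": "In short:", "prefix": True},
    ],
)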

mistralai_azure/models/chatcompletionrequest.py
CHANGED

@@ -2,6 +2,7 @@
 
 from __future__ import annotations
 from .assistantmessage import AssistantMessage, AssistantMessageTypedDict
+from .prediction import Prediction, PredictionTypedDict
 from .responseformat import ResponseFormat, ResponseFormatTypedDict
 from .systemmessage import SystemMessage, SystemMessageTypedDict
 from .tool import Tool, ToolTypedDict
@@ -70,7 +71,7 @@ ChatCompletionRequestToolChoice = TypeAliasType(
 class ChatCompletionRequestTypedDict(TypedDict):
     messages: List[ChatCompletionRequestMessagesTypedDict]
     r"""The prompt(s) to generate completions for, encoded as a list of dict with role and content."""
-    model: NotRequired[
+    model: NotRequired[str]
     r"""The ID of the model to use for this request."""
     temperature: NotRequired[Nullable[float]]
     r"""What sampling temperature to use, we recommend between 0.0 and 0.7. Higher values like 0.7 will make the output more random, while lower values like 0.2 will make it more focused and deterministic. We generally recommend altering this or `top_p` but not both. The default value varies depending on the model you are targeting. Call the `/models` endpoint to retrieve the appropriate value."""
@@ -93,6 +94,8 @@ class ChatCompletionRequestTypedDict(TypedDict):
     r"""frequency_penalty penalizes the repetition of words based on their frequency in the generated text. A higher frequency penalty discourages the model from repeating words that have already appeared frequently in the output, promoting diversity and reducing repetition."""
     n: NotRequired[Nullable[int]]
     r"""Number of completions to return for each request, input tokens are only billed once."""
+    prediction: NotRequired[PredictionTypedDict]
+    parallel_tool_calls: NotRequired[bool]
     safe_prompt: NotRequired[bool]
     r"""Whether to inject a safety prompt before all conversations."""
 
@@ -101,7 +104,7 @@ class ChatCompletionRequest(BaseModel):
     messages: List[ChatCompletionRequestMessages]
     r"""The prompt(s) to generate completions for, encoded as a list of dict with role and content."""
 
-    model:
+    model: Optional[str] = "azureai"
     r"""The ID of the model to use for this request."""
 
     temperature: OptionalNullable[float] = UNSET
@@ -137,6 +140,10 @@ class ChatCompletionRequest(BaseModel):
     n: OptionalNullable[int] = UNSET
     r"""Number of completions to return for each request, input tokens are only billed once."""
 
+    prediction: Optional[Prediction] = None
+
+    parallel_tool_calls: Optional[bool] = None
+
     safe_prompt: Optional[bool] = None
     r"""Whether to inject a safety prompt before all conversations."""
 
@@ -156,16 +163,11 @@ class ChatCompletionRequest(BaseModel):
             "presence_penalty",
             "frequency_penalty",
             "n",
+            "prediction",
+            "parallel_tool_calls",
             "safe_prompt",
         ]
-        nullable_fields = [
-            "model",
-            "temperature",
-            "max_tokens",
-            "random_seed",
-            "tools",
-            "n",
-        ]
+        nullable_fields = ["temperature", "max_tokens", "random_seed", "tools", "n"]
         null_default_fields = []
 
         serialized = handler(self)

mistralai_azure/models/chatcompletionstreamrequest.py
CHANGED

@@ -2,6 +2,7 @@
 
 from __future__ import annotations
 from .assistantmessage import AssistantMessage, AssistantMessageTypedDict
+from .prediction import Prediction, PredictionTypedDict
 from .responseformat import ResponseFormat, ResponseFormatTypedDict
 from .systemmessage import SystemMessage, SystemMessageTypedDict
 from .tool import Tool, ToolTypedDict
@@ -66,7 +67,7 @@ ChatCompletionStreamRequestToolChoice = TypeAliasType(
 class ChatCompletionStreamRequestTypedDict(TypedDict):
     messages: List[MessagesTypedDict]
     r"""The prompt(s) to generate completions for, encoded as a list of dict with role and content."""
-    model: NotRequired[
+    model: NotRequired[str]
     r"""The ID of the model to use for this request."""
     temperature: NotRequired[Nullable[float]]
     r"""What sampling temperature to use, we recommend between 0.0 and 0.7. Higher values like 0.7 will make the output more random, while lower values like 0.2 will make it more focused and deterministic. We generally recommend altering this or `top_p` but not both. The default value varies depending on the model you are targeting. Call the `/models` endpoint to retrieve the appropriate value."""
@@ -88,6 +89,8 @@ class ChatCompletionStreamRequestTypedDict(TypedDict):
     r"""frequency_penalty penalizes the repetition of words based on their frequency in the generated text. A higher frequency penalty discourages the model from repeating words that have already appeared frequently in the output, promoting diversity and reducing repetition."""
     n: NotRequired[Nullable[int]]
     r"""Number of completions to return for each request, input tokens are only billed once."""
+    prediction: NotRequired[PredictionTypedDict]
+    parallel_tool_calls: NotRequired[bool]
     safe_prompt: NotRequired[bool]
     r"""Whether to inject a safety prompt before all conversations."""
 
@@ -96,7 +99,7 @@ class ChatCompletionStreamRequest(BaseModel):
     messages: List[Messages]
     r"""The prompt(s) to generate completions for, encoded as a list of dict with role and content."""
 
-    model:
+    model: Optional[str] = "azureai"
     r"""The ID of the model to use for this request."""
 
     temperature: OptionalNullable[float] = UNSET
@@ -131,6 +134,10 @@ class ChatCompletionStreamRequest(BaseModel):
     n: OptionalNullable[int] = UNSET
     r"""Number of completions to return for each request, input tokens are only billed once."""
 
+    prediction: Optional[Prediction] = None
+
+    parallel_tool_calls: Optional[bool] = None
+
     safe_prompt: Optional[bool] = None
     r"""Whether to inject a safety prompt before all conversations."""
 
@@ -150,16 +157,11 @@ class ChatCompletionStreamRequest(BaseModel):
             "presence_penalty",
            "frequency_penalty",
            "n",
+            "prediction",
+            "parallel_tool_calls",
            "safe_prompt",
        ]
-        nullable_fields = [
-            "model",
-            "temperature",
-            "max_tokens",
-            "random_seed",
-            "tools",
-            "n",
-        ]
+        nullable_fields = ["temperature", "max_tokens", "random_seed", "tools", "n"]
         null_default_fields = []
 
         serialized = handler(self)

mistralai_azure/models/contentchunk.py
CHANGED

@@ -1,6 +1,7 @@
 """Code generated by Speakeasy (https://speakeasy.com). DO NOT EDIT."""
 
 from __future__ import annotations
+from .imageurlchunk import ImageURLChunk, ImageURLChunkTypedDict
 from .referencechunk import ReferenceChunk, ReferenceChunkTypedDict
 from .textchunk import TextChunk, TextChunkTypedDict
 from mistralai_azure.utils import get_discriminator
@@ -10,13 +11,16 @@ from typing_extensions import Annotated, TypeAliasType
 
 
 ContentChunkTypedDict = TypeAliasType(
-    "ContentChunkTypedDict",
+    "ContentChunkTypedDict",
+    Union[TextChunkTypedDict, ImageURLChunkTypedDict, ReferenceChunkTypedDict],
 )
 
 
 ContentChunk = Annotated[
     Union[
-        Annotated[
+        Annotated[ImageURLChunk, Tag("image_url")],
+        Annotated[TextChunk, Tag("text")],
+        Annotated[ReferenceChunk, Tag("reference")],
     ],
     Discriminator(lambda m: get_discriminator(m, "type", "type")),
 ]
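
With ImageURLChunk joining the content-chunk union, a user message can now mix text and image chunks. A sketch, assuming image_url accepts either a bare URL string or an ImageURL object (per the new ImageURLChunkImageURL union) and again reusing the illustrative client from above:

res = client.chat.complete(
    messages=[
        {
            "role": "user",
            "content": [
                {"type": "text", "text": "What does this chart show?"},
                # A plain URL string; a {"url": ...} object should also be accepted.
                {"type": "image_url", "image_url": "https://example.com/chart.png"},
            ],
        }
    ],
)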

mistralai_azure/models/function.py
CHANGED

@@ -10,6 +10,7 @@ class FunctionTypedDict(TypedDict):
     name: str
     parameters: Dict[str, Any]
     description: NotRequired[str]
+    strict: NotRequired[bool]
 
 
 class Function(BaseModel):
@@ -17,4 +18,6 @@ class Function(BaseModel):
 
     parameters: Dict[str, Any]
 
-    description: Optional[str] =
+    description: Optional[str] = None
+
+    strict: Optional[bool] = None