mistralai 1.9.10__py3-none-any.whl → 1.10.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions as they appear in their respective public registries.
- mistralai/_hooks/registration.py +5 -0
- mistralai/_hooks/tracing.py +50 -0
- mistralai/_version.py +3 -3
- mistralai/accesses.py +51 -116
- mistralai/agents.py +58 -85
- mistralai/audio.py +8 -3
- mistralai/basesdk.py +15 -5
- mistralai/batch.py +6 -3
- mistralai/beta.py +10 -5
- mistralai/chat.py +70 -97
- mistralai/classifiers.py +57 -144
- mistralai/conversations.py +435 -412
- mistralai/documents.py +156 -359
- mistralai/embeddings.py +21 -42
- mistralai/extra/observability/__init__.py +15 -0
- mistralai/extra/observability/otel.py +393 -0
- mistralai/extra/run/tools.py +28 -16
- mistralai/files.py +53 -176
- mistralai/fim.py +46 -73
- mistralai/fine_tuning.py +6 -3
- mistralai/jobs.py +49 -158
- mistralai/libraries.py +71 -178
- mistralai/mistral_agents.py +298 -179
- mistralai/mistral_jobs.py +51 -138
- mistralai/models/__init__.py +94 -5
- mistralai/models/agent.py +15 -2
- mistralai/models/agentconversation.py +11 -3
- mistralai/models/agentcreationrequest.py +6 -2
- mistralai/models/agents_api_v1_agents_deleteop.py +16 -0
- mistralai/models/agents_api_v1_agents_getop.py +40 -3
- mistralai/models/agents_api_v1_agents_listop.py +72 -2
- mistralai/models/agents_api_v1_conversations_deleteop.py +18 -0
- mistralai/models/agents_api_v1_conversations_listop.py +39 -2
- mistralai/models/agentscompletionrequest.py +21 -6
- mistralai/models/agentscompletionstreamrequest.py +21 -6
- mistralai/models/agentupdaterequest.py +18 -2
- mistralai/models/audiotranscriptionrequest.py +2 -0
- mistralai/models/batchjobin.py +10 -0
- mistralai/models/chatcompletionrequest.py +22 -5
- mistralai/models/chatcompletionstreamrequest.py +22 -5
- mistralai/models/conversationrequest.py +15 -4
- mistralai/models/conversationrestartrequest.py +50 -2
- mistralai/models/conversationrestartstreamrequest.py +50 -2
- mistralai/models/conversationstreamrequest.py +15 -4
- mistralai/models/documentout.py +26 -10
- mistralai/models/documentupdatein.py +24 -3
- mistralai/models/embeddingrequest.py +8 -8
- mistralai/models/files_api_routes_list_filesop.py +7 -0
- mistralai/models/fimcompletionrequest.py +8 -9
- mistralai/models/fimcompletionstreamrequest.py +8 -9
- mistralai/models/httpvalidationerror.py +11 -6
- mistralai/models/libraries_documents_list_v1op.py +15 -2
- mistralai/models/libraryout.py +10 -7
- mistralai/models/listfilesout.py +35 -4
- mistralai/models/mistralerror.py +26 -0
- mistralai/models/modelcapabilities.py +13 -4
- mistralai/models/modelconversation.py +8 -2
- mistralai/models/no_response_error.py +13 -0
- mistralai/models/ocrpageobject.py +26 -5
- mistralai/models/ocrrequest.py +17 -1
- mistralai/models/ocrtableobject.py +31 -0
- mistralai/models/prediction.py +4 -0
- mistralai/models/requestsource.py +7 -0
- mistralai/models/responseformat.py +4 -2
- mistralai/models/responseformats.py +0 -1
- mistralai/models/responsevalidationerror.py +25 -0
- mistralai/models/sdkerror.py +30 -14
- mistralai/models/sharingdelete.py +36 -5
- mistralai/models/sharingin.py +36 -5
- mistralai/models/sharingout.py +3 -3
- mistralai/models/toolexecutiondeltaevent.py +13 -4
- mistralai/models/toolexecutiondoneevent.py +13 -4
- mistralai/models/toolexecutionentry.py +9 -4
- mistralai/models/toolexecutionstartedevent.py +13 -4
- mistralai/models_.py +67 -212
- mistralai/ocr.py +33 -36
- mistralai/sdk.py +15 -2
- mistralai/transcriptions.py +21 -60
- mistralai/utils/__init__.py +18 -5
- mistralai/utils/eventstreaming.py +10 -0
- mistralai/utils/serializers.py +3 -2
- mistralai/utils/unmarshal_json_response.py +24 -0
- {mistralai-1.9.10.dist-info → mistralai-1.10.0.dist-info}/METADATA +89 -40
- {mistralai-1.9.10.dist-info → mistralai-1.10.0.dist-info}/RECORD +86 -75
- {mistralai-1.9.10.dist-info → mistralai-1.10.0.dist-info}/WHEEL +1 -1
- {mistralai-1.9.10.dist-info → mistralai-1.10.0.dist-info/licenses}/LICENSE +0 -0
mistralai/embeddings.py
CHANGED
@@ -5,6 +5,7 @@ from mistralai import models, utils
 from mistralai._hooks import HookContext
 from mistralai.types import OptionalNullable, UNSET
 from mistralai.utils import get_security_from_env
+from mistralai.utils.unmarshal_json_response import unmarshal_json_response
 from typing import Any, Mapping, Optional, Union
 
 
@@ -30,9 +31,9 @@ class Embeddings(BaseSDK):
 
         Embeddings
 
-        :param model: ID of the model to
-        :param inputs:
-        :param output_dimension: The dimension of the output embeddings.
+        :param model: The ID of the model to be used for embedding.
+        :param inputs: The text content to be embedded, can be a string or an array of strings for fast processing in bulk.
+        :param output_dimension: The dimension of the output embeddings when feature available. If not provided, a default output dimension will be used.
         :param output_dtype:
         :param encoding_format:
         :param retries: Override the default retry configuration for this method
@@ -102,31 +103,20 @@ class Embeddings(BaseSDK):
 
         response_data: Any = None
         if utils.match_response(http_res, "200", "application/json"):
-            return
+            return unmarshal_json_response(models.EmbeddingResponse, http_res)
         if utils.match_response(http_res, "422", "application/json"):
-            response_data =
-
+            response_data = unmarshal_json_response(
+                models.HTTPValidationErrorData, http_res
             )
-            raise models.HTTPValidationError(
+            raise models.HTTPValidationError(response_data, http_res)
         if utils.match_response(http_res, "4XX", "*"):
             http_res_text = utils.stream_to_text(http_res)
-            raise models.SDKError(
-                "API error occurred", http_res.status_code, http_res_text, http_res
-            )
+            raise models.SDKError("API error occurred", http_res, http_res_text)
         if utils.match_response(http_res, "5XX", "*"):
             http_res_text = utils.stream_to_text(http_res)
-            raise models.SDKError(
-                "API error occurred", http_res.status_code, http_res_text, http_res
-            )
+            raise models.SDKError("API error occurred", http_res, http_res_text)
 
-
-        http_res_text = utils.stream_to_text(http_res)
-        raise models.SDKError(
-            f"Unexpected response received (code: {http_res.status_code}, type: {content_type})",
-            http_res.status_code,
-            http_res_text,
-            http_res,
-        )
+        raise models.SDKError("Unexpected response received", http_res)
 
     async def create_async(
         self,
@@ -147,9 +137,9 @@ class Embeddings(BaseSDK):
 
         Embeddings
 
-        :param model: ID of the model to
-        :param inputs:
-        :param output_dimension: The dimension of the output embeddings.
+        :param model: The ID of the model to be used for embedding.
+        :param inputs: The text content to be embedded, can be a string or an array of strings for fast processing in bulk.
+        :param output_dimension: The dimension of the output embeddings when feature available. If not provided, a default output dimension will be used.
         :param output_dtype:
         :param encoding_format:
         :param retries: Override the default retry configuration for this method
@@ -219,28 +209,17 @@ class Embeddings(BaseSDK):
 
         response_data: Any = None
         if utils.match_response(http_res, "200", "application/json"):
-            return
+            return unmarshal_json_response(models.EmbeddingResponse, http_res)
         if utils.match_response(http_res, "422", "application/json"):
-            response_data =
-
+            response_data = unmarshal_json_response(
+                models.HTTPValidationErrorData, http_res
            )
-            raise models.HTTPValidationError(
+            raise models.HTTPValidationError(response_data, http_res)
         if utils.match_response(http_res, "4XX", "*"):
             http_res_text = await utils.stream_to_text_async(http_res)
-            raise models.SDKError(
-                "API error occurred", http_res.status_code, http_res_text, http_res
-            )
+            raise models.SDKError("API error occurred", http_res, http_res_text)
         if utils.match_response(http_res, "5XX", "*"):
             http_res_text = await utils.stream_to_text_async(http_res)
-            raise models.SDKError(
-                "API error occurred", http_res.status_code, http_res_text, http_res
-            )
+            raise models.SDKError("API error occurred", http_res, http_res_text)
 
-
-        http_res_text = await utils.stream_to_text_async(http_res)
-        raise models.SDKError(
-            f"Unexpected response received (code: {http_res.status_code}, type: {content_type})",
-            http_res.status_code,
-            http_res_text,
-            http_res,
-        )
+        raise models.SDKError("Unexpected response received", http_res)
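For SDK callers, the visible change in this file is the error surface: success and 422 bodies are now decoded through the new `unmarshal_json_response` helper, and `SDKError` receives the `httpx` response object as its second argument instead of a bare status code. A minimal caller-side sketch of what this means in practice (the `create` call follows the SDK's public surface; exception attributes beyond what this diff shows are not assumed):

from mistralai import Mistral, models

client = Mistral(api_key="...")

try:
    resp = client.embeddings.create(
        model="mistral-embed",
        inputs=["Hello, world!"],
    )
except models.HTTPValidationError as err:
    # 422: raised as HTTPValidationError(response_data, http_res) in 1.10.0
    print("validation error:", err)
except models.SDKError as err:
    # 4XX/5XX: raised as SDKError("API error occurred", http_res, http_res_text),
    # replacing SDKError(message, status_code, body, raw_response)
    print("API error:", err)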
mistralai/extra/observability/__init__.py
ADDED
@@ -0,0 +1,15 @@
+from contextlib import contextmanager
+
+from opentelemetry import trace as otel_trace
+
+from .otel import MISTRAL_SDK_OTEL_TRACER_NAME
+
+
+@contextmanager
+def trace(name: str, **kwargs):
+    tracer = otel_trace.get_tracer(MISTRAL_SDK_OTEL_TRACER_NAME)
+    with tracer.start_as_current_span(name, **kwargs) as span:
+        yield span
+
+
+__all__ = ["trace"]
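The new `trace` helper is a thin wrapper over `start_as_current_span` on the SDK's named tracer, so application code can group work under a custom span without importing OpenTelemetry directly. A minimal usage sketch (the span name and attributes are illustrative; extra kwargs are forwarded to `start_as_current_span`):

from mistralai.extra.observability import trace

# Opens a span on the SDK tracer ("mistralai_sdk_tracer"); spans created
# by SDK calls inside the block become children of this span.
with trace("embed-and-index", attributes={"app.job_id": "demo-123"}) as span:
    span.add_event("starting batch")
    ...  # SDK calls here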
mistralai/extra/observability/otel.py
ADDED
@@ -0,0 +1,393 @@
+import copy
+import json
+import logging
+import os
+import traceback
+from datetime import datetime, timezone
+from enum import Enum
+from typing import Optional, Tuple
+
+import httpx
+import opentelemetry.semconv._incubating.attributes.gen_ai_attributes as gen_ai_attributes
+import opentelemetry.semconv._incubating.attributes.http_attributes as http_attributes
+import opentelemetry.semconv.attributes.server_attributes as server_attributes
+from opentelemetry import propagate, trace
+from opentelemetry.exporter.otlp.proto.http.trace_exporter import OTLPSpanExporter
+from opentelemetry.sdk.resources import SERVICE_NAME, Resource
+from opentelemetry.sdk.trace import SpanProcessor, TracerProvider
+from opentelemetry.sdk.trace.export import BatchSpanProcessor, SpanExportResult
+from opentelemetry.trace import Span, Status, StatusCode, Tracer, set_span_in_context
+
+logger = logging.getLogger(__name__)
+
+
+OTEL_SERVICE_NAME: str = "mistralai_sdk"
+OTEL_EXPORTER_OTLP_ENDPOINT: str = os.getenv("OTEL_EXPORTER_OTLP_ENDPOINT", "")
+OTEL_EXPORTER_OTLP_TIMEOUT: int = int(os.getenv("OTEL_EXPORTER_OTLP_TIMEOUT", "2"))
+OTEL_EXPORTER_OTLP_MAX_EXPORT_BATCH_SIZE: int = int(os.getenv("OTEL_EXPORTER_OTLP_MAX_EXPORT_BATCH_SIZE", "512"))
+OTEL_EXPORTER_OTLP_SCHEDULE_DELAY_MILLIS: int = int(os.getenv("OTEL_EXPORTER_OTLP_SCHEDULE_DELAY_MILLIS", "1000"))
+OTEL_EXPORTER_OTLP_MAX_QUEUE_SIZE: int = int(os.getenv("OTEL_EXPORTER_OTLP_MAX_QUEUE_SIZE", "2048"))
+OTEL_EXPORTER_OTLP_EXPORT_TIMEOUT_MILLIS: int = int(os.getenv("OTEL_EXPORTER_OTLP_EXPORT_TIMEOUT_MILLIS", "5000"))
+
+MISTRAL_SDK_OTEL_TRACER_NAME: str = OTEL_SERVICE_NAME + "_tracer"
+
+MISTRAL_SDK_DEBUG_TRACING: bool = os.getenv("MISTRAL_SDK_DEBUG_TRACING", "false").lower() == "true"
+DEBUG_HINT: str = "To see detailed exporter logs, set MISTRAL_SDK_DEBUG_TRACING=true."
+
+
+class MistralAIAttributes:
+    MISTRAL_AI_TOTAL_TOKENS = "mistral_ai.request.total_tokens"
+    MISTRAL_AI_TOOL_CALL_ARGUMENTS = "mistral_ai.tool.call.arguments"
+    MISTRAL_AI_MESSAGE_ID = "mistral_ai.message.id"
+    MISTRAL_AI_OPERATION_NAME = "mistral_ai.operation.name"
+    MISTRAL_AI_OCR_USAGE_PAGES_PROCESSED = "mistral_ai.ocr.usage.pages_processed"
+    MISTRAL_AI_OCR_USAGE_DOC_SIZE_BYTES = "mistral_ai.ocr.usage.doc_size_bytes"
+    MISTRAL_AI_OPERATION_ID = "mistral_ai.operation.id"
+    MISTRAL_AI_ERROR_TYPE = "mistral_ai.error.type"
+    MISTRAL_AI_ERROR_MESSAGE = "mistral_ai.error.message"
+    MISTRAL_AI_ERROR_CODE = "mistral_ai.error.code"
+    MISTRAL_AI_FUNCTION_CALL_ARGUMENTS = "mistral_ai.function.call.arguments"
+
+class MistralAINameValues(Enum):
+    OCR = "ocr"
+
+class TracingErrors(Exception, Enum):
+    FAILED_TO_EXPORT_OTEL_SPANS = "Failed to export OpenTelemetry (OTEL) spans."
+    FAILED_TO_INITIALIZE_OPENTELEMETRY_TRACING = "Failed to initialize OpenTelemetry tracing."
+    FAILED_TO_CREATE_SPAN_FOR_REQUEST = "Failed to create span for request."
+    FAILED_TO_ENRICH_SPAN_WITH_RESPONSE = "Failed to enrich span with response."
+    FAILED_TO_HANDLE_ERROR_IN_SPAN = "Failed to handle error in span."
+    FAILED_TO_END_SPAN = "Failed to end span."
+
+    def __str__(self):
+        return str(self.value)
+
+class GenAISpanEnum(str, Enum):
+    CONVERSATION = "conversation"
+    CONV_REQUEST = "POST /v1/conversations"
+    EXECUTE_TOOL = "execute_tool"
+    VALIDATE_RUN = "validate_run"
+
+    @staticmethod
+    def function_call(func_name: str):
+        return f"function_call[{func_name}]"
+
+
+def parse_time_to_nanos(ts: str) -> int:
+    dt = datetime.fromisoformat(ts.replace("Z", "+00:00")).astimezone(timezone.utc)
+    return int(dt.timestamp() * 1e9)
+
+def set_available_attributes(span: Span, attributes: dict) -> None:
+    for attribute, value in attributes.items():
+        if value:
+            span.set_attribute(attribute, value)
+
+
+def enrich_span_from_request(span: Span, request: httpx.Request) -> Span:
+    if not request.url.port:
+        # From httpx doc:
+        # Note that the URL class performs port normalization as per the WHATWG spec.
+        # Default ports for "http", "https", "ws", "wss", and "ftp" schemes are always treated as None.
+        # Handling default ports since most of the time we are using https
+        if request.url.scheme == "https":
+            port = 443
+        elif request.url.scheme == "http":
+            port = 80
+        else:
+            port = -1
+    else:
+        port = request.url.port
+
+    span.set_attributes({
+        http_attributes.HTTP_REQUEST_METHOD: request.method,
+        http_attributes.HTTP_URL: str(request.url),
+        server_attributes.SERVER_ADDRESS: request.headers.get("host", ""),
+        server_attributes.SERVER_PORT: port
+    })
+    if request._content:
+        request_body = json.loads(request._content)
+
+        attributes = {
+            gen_ai_attributes.GEN_AI_REQUEST_CHOICE_COUNT: request_body.get("n", None),
+            gen_ai_attributes.GEN_AI_REQUEST_ENCODING_FORMATS: request_body.get("encoding_formats", None),
+            gen_ai_attributes.GEN_AI_REQUEST_FREQUENCY_PENALTY: request_body.get("frequency_penalty", None),
+            gen_ai_attributes.GEN_AI_REQUEST_MAX_TOKENS: request_body.get("max_tokens", None),
+            gen_ai_attributes.GEN_AI_REQUEST_MODEL: request_body.get("model", None),
+            gen_ai_attributes.GEN_AI_REQUEST_PRESENCE_PENALTY: request_body.get("presence_penalty", None),
+            gen_ai_attributes.GEN_AI_REQUEST_SEED: request_body.get("random_seed", None),
+            gen_ai_attributes.GEN_AI_REQUEST_STOP_SEQUENCES: request_body.get("stop", None),
+            gen_ai_attributes.GEN_AI_REQUEST_TEMPERATURE: request_body.get("temperature", None),
+            gen_ai_attributes.GEN_AI_REQUEST_TOP_P: request_body.get("top_p", None),
+            gen_ai_attributes.GEN_AI_REQUEST_TOP_K: request_body.get("top_k", None),
+            # Input messages are likely to be large, containing user/PII data and other sensitive information.
+            # Also structured attributes are not yet supported on spans in Python.
+            # For those reasons, we will not record the input messages for now.
+            gen_ai_attributes.GEN_AI_INPUT_MESSAGES: None,
+        }
+        # Set attributes only if they are not None.
+        # From OpenTelemetry documentation: None is not a valid attribute value per spec / is not a permitted value type for an attribute.
+        set_available_attributes(span, attributes)
+    return span
+
+
+def enrich_span_from_response(tracer: trace.Tracer, span: Span, operation_id: str, response: httpx.Response) -> None:
+    span.set_status(Status(StatusCode.OK))
+    response_data = json.loads(response.content)
+
+    # Base attributes
+    attributes: dict[str, str | int] = {
+        http_attributes.HTTP_RESPONSE_STATUS_CODE: response.status_code,
+        MistralAIAttributes.MISTRAL_AI_OPERATION_ID: operation_id,
+        gen_ai_attributes.GEN_AI_PROVIDER_NAME: gen_ai_attributes.GenAiProviderNameValues.MISTRAL_AI.value
+    }
+
+    # Add usage attributes if available
+    usage = response_data.get("usage", {})
+    if usage:
+        attributes.update({
+            gen_ai_attributes.GEN_AI_USAGE_PROMPT_TOKENS: usage.get("prompt_tokens", 0),
+            gen_ai_attributes.GEN_AI_USAGE_OUTPUT_TOKENS: usage.get("completion_tokens", 0),
+            MistralAIAttributes.MISTRAL_AI_TOTAL_TOKENS: usage.get("total_tokens", 0)
+        })
+
+    span.set_attributes(attributes)
+    if operation_id == "agents_api_v1_agents_create":
+        # Semantics from https://opentelemetry.io/docs/specs/semconv/gen-ai/gen-ai-agent-spans/#create-agent-span
+        agent_attributes = {
+            gen_ai_attributes.GEN_AI_OPERATION_NAME: gen_ai_attributes.GenAiOperationNameValues.CREATE_AGENT.value,
+            gen_ai_attributes.GEN_AI_AGENT_DESCRIPTION: response_data.get("description", ""),
+            gen_ai_attributes.GEN_AI_AGENT_ID: response_data.get("id", ""),
+            gen_ai_attributes.GEN_AI_AGENT_NAME: response_data.get("name", ""),
+            gen_ai_attributes.GEN_AI_REQUEST_MODEL: response_data.get("model", ""),
+            gen_ai_attributes.GEN_AI_SYSTEM_INSTRUCTIONS: response_data.get("instructions", "")
+        }
+        span.set_attributes(agent_attributes)
+    if operation_id in ["agents_api_v1_conversations_start", "agents_api_v1_conversations_append"]:
+        outputs = response_data.get("outputs", [])
+        conversation_attributes = {
+            gen_ai_attributes.GEN_AI_OPERATION_NAME: gen_ai_attributes.GenAiOperationNameValues.INVOKE_AGENT.value,
+            gen_ai_attributes.GEN_AI_CONVERSATION_ID: response_data.get("conversation_id", "")
+        }
+        span.set_attributes(conversation_attributes)
+        parent_context = set_span_in_context(span)
+
+        for output in outputs:
+            # TODO: Only enrich the spans if it's a single turn conversation.
+            # Multi turn conversations are handled in the extra.run.tools.create_function_result function
+            if output["type"] == "function.call":
+                pass
+            if output["type"] == "tool.execution":
+                start_ns = parse_time_to_nanos(output["created_at"])
+                end_ns = parse_time_to_nanos(output["completed_at"])
+                child_span = tracer.start_span("Tool Execution", start_time=start_ns, context=parent_context)
+                tool_attributes = {
+                    gen_ai_attributes.GEN_AI_OPERATION_NAME: gen_ai_attributes.GenAiOperationNameValues.EXECUTE_TOOL.value,
+                    gen_ai_attributes.GEN_AI_TOOL_CALL_ID: output.get("id", ""),
+                    MistralAIAttributes.MISTRAL_AI_TOOL_CALL_ARGUMENTS: output.get("arguments", ""),
+                    gen_ai_attributes.GEN_AI_TOOL_NAME: output.get("name", "")
+                }
+                child_span.set_attributes(tool_attributes)
+                child_span.end(end_time=end_ns)
+            if output["type"] == "message.output":
+                start_ns = parse_time_to_nanos(output["created_at"])
+                end_ns = parse_time_to_nanos(output["completed_at"])
+                child_span = tracer.start_span("Message Output", start_time=start_ns, context=parent_context)
+                message_attributes = {
+                    gen_ai_attributes.GEN_AI_OPERATION_NAME: gen_ai_attributes.GenAiOperationNameValues.CHAT.value,
+                    gen_ai_attributes.GEN_AI_PROVIDER_NAME: gen_ai_attributes.GenAiProviderNameValues.MISTRAL_AI.value,
+                    MistralAIAttributes.MISTRAL_AI_MESSAGE_ID: output.get("id", ""),
+                    gen_ai_attributes.GEN_AI_AGENT_ID: output.get("agent_id", ""),
+                    gen_ai_attributes.GEN_AI_REQUEST_MODEL: output.get("model", "")
+                }
+                child_span.set_attributes(message_attributes)
+                child_span.end(end_time=end_ns)
+    if operation_id == "ocr_v1_ocr_post":
+        usage_info = response_data.get("usage_info", "")
+        ocr_attributes = {
+            MistralAIAttributes.MISTRAL_AI_OPERATION_NAME: MistralAINameValues.OCR.value,
+            MistralAIAttributes.MISTRAL_AI_OCR_USAGE_PAGES_PROCESSED: usage_info.get("pages_processed", "") if usage_info else "",
+            MistralAIAttributes.MISTRAL_AI_OCR_USAGE_DOC_SIZE_BYTES: usage_info.get("doc_size_bytes", "") if usage_info else "",
+            gen_ai_attributes.GEN_AI_REQUEST_MODEL: response_data.get("model", "")
+        }
+        span.set_attributes(ocr_attributes)
+
+
+class GenAISpanProcessor(SpanProcessor):
+    def on_start(self, span, parent_context = None):
+        span.set_attributes({"agent.trace.public": ""})
+
+
+class QuietOTLPSpanExporter(OTLPSpanExporter):
+    def export(self, spans):
+        try:
+            return super().export(spans)
+        except Exception:
+            logger.warning(f"{TracingErrors.FAILED_TO_EXPORT_OTEL_SPANS} {(traceback.format_exc() if MISTRAL_SDK_DEBUG_TRACING else DEBUG_HINT)}")
+            return SpanExportResult.FAILURE
+
+
+def get_or_create_otel_tracer() -> Tuple[bool, Tracer]:
+    """
+    3 possible cases:
+
+    -> [SDK in a Workflow / App] If there is already a tracer provider set -> use that one
+
+    -> [SDK standalone] If no tracer provider is set but the OTEL_EXPORTER_OTLP_ENDPOINT is set -> create a new tracer provider that exports to the OTEL_EXPORTER_OTLP_ENDPOINT
+
+    -> Else tracing is disabled
+    """
+    tracing_enabled = True
+    tracer_provider = trace.get_tracer_provider()
+
+    if isinstance(tracer_provider, trace.ProxyTracerProvider):
+        if OTEL_EXPORTER_OTLP_ENDPOINT:
+            # SDK standalone: No tracer provider but OTEL_EXPORTER_OTLP_ENDPOINT is set -> create a new tracer provider that exports to the OTEL_EXPORTER_OTLP_ENDPOINT
+            try:
+                exporter = QuietOTLPSpanExporter(
+                    endpoint=OTEL_EXPORTER_OTLP_ENDPOINT,
+                    timeout=OTEL_EXPORTER_OTLP_TIMEOUT
+                )
+                resource = Resource.create(attributes={SERVICE_NAME: OTEL_SERVICE_NAME})
+                tracer_provider = TracerProvider(resource=resource)
+
+                span_processor = BatchSpanProcessor(
+                    exporter,
+                    export_timeout_millis=OTEL_EXPORTER_OTLP_EXPORT_TIMEOUT_MILLIS,
+                    max_export_batch_size=OTEL_EXPORTER_OTLP_MAX_EXPORT_BATCH_SIZE,
+                    schedule_delay_millis=OTEL_EXPORTER_OTLP_SCHEDULE_DELAY_MILLIS,
+                    max_queue_size=OTEL_EXPORTER_OTLP_MAX_QUEUE_SIZE
+                )
+
+                tracer_provider.add_span_processor(span_processor)
+                tracer_provider.add_span_processor(GenAISpanProcessor())
+                trace.set_tracer_provider(tracer_provider)
+
+            except Exception:
+                logger.warning(f"{TracingErrors.FAILED_TO_INITIALIZE_OPENTELEMETRY_TRACING} {(traceback.format_exc() if MISTRAL_SDK_DEBUG_TRACING else DEBUG_HINT)}")
+                tracing_enabled = False
+        else:
+            # No tracer provider nor OTEL_EXPORTER_OTLP_ENDPOINT set -> tracing is disabled
+            tracing_enabled = False
+
+    tracer = tracer_provider.get_tracer(MISTRAL_SDK_OTEL_TRACER_NAME)
+
+    return tracing_enabled, tracer
+
+def get_traced_request_and_span(tracing_enabled: bool, tracer: Tracer, span: Optional[Span], operation_id: str, request: httpx.Request) -> Tuple[httpx.Request, Optional[Span]]:
+    if not tracing_enabled:
+        return request, span
+
+    try:
+        span = tracer.start_span(name=operation_id)
+        # Inject the span context into the request headers to be used by the backend service to continue the trace
+        propagate.inject(request.headers)
+        span = enrich_span_from_request(span, request)
+    except Exception:
+        logger.warning(
+            "%s %s",
+            TracingErrors.FAILED_TO_CREATE_SPAN_FOR_REQUEST,
+            traceback.format_exc() if MISTRAL_SDK_DEBUG_TRACING else DEBUG_HINT,
+        )
+        if span:
+            end_span(span=span)
+            span = None
+
+    return request, span
+
+
+def get_traced_response(tracing_enabled: bool, tracer: Tracer, span: Optional[Span], operation_id: str, response: httpx.Response) -> httpx.Response:
+    if not tracing_enabled or not span:
+        return response
+    try:
+        is_stream_response = not response.is_closed and not response.is_stream_consumed
+        if is_stream_response:
+            return TracedResponse.from_response(resp=response, span=span)
+        enrich_span_from_response(
+            tracer, span, operation_id, response
+        )
+    except Exception:
+        logger.warning(
+            "%s %s",
+            TracingErrors.FAILED_TO_ENRICH_SPAN_WITH_RESPONSE,
+            traceback.format_exc() if MISTRAL_SDK_DEBUG_TRACING else DEBUG_HINT,
+        )
+    if span:
+        end_span(span=span)
+    return response
+
+def get_response_and_error(tracing_enabled: bool, tracer: Tracer, span: Optional[Span], operation_id: str, response: httpx.Response, error: Optional[Exception]) -> Tuple[httpx.Response, Optional[Exception]]:
+    if not tracing_enabled or not span:
+        return response, error
+    try:
+        if error:
+            span.record_exception(error)
+            span.set_status(Status(StatusCode.ERROR, str(error)))
+            if hasattr(response, "_content") and response._content:
+                response_body = json.loads(response._content)
+                if response_body.get("object", "") == "error":
+                    if error_msg := response_body.get("message", ""):
+                        attributes = {
+                            http_attributes.HTTP_RESPONSE_STATUS_CODE: response.status_code,
+                            MistralAIAttributes.MISTRAL_AI_ERROR_TYPE: response_body.get("type", ""),
+                            MistralAIAttributes.MISTRAL_AI_ERROR_MESSAGE: error_msg,
+                            MistralAIAttributes.MISTRAL_AI_ERROR_CODE: response_body.get("code", ""),
+                        }
+                        for attribute, value in attributes.items():
+                            if value:
+                                span.set_attribute(attribute, value)
+            span.end()
+            span = None
+    except Exception:
+        logger.warning(
+            "%s %s",
+            TracingErrors.FAILED_TO_HANDLE_ERROR_IN_SPAN,
+            traceback.format_exc() if MISTRAL_SDK_DEBUG_TRACING else DEBUG_HINT,
+        )
+
+    if span:
+        span.end()
+        span = None
+    return response, error
+
+
+def end_span(span: Span) -> None:
+    try:
+        span.end()
+    except Exception:
+        logger.warning(
+            "%s %s",
+            TracingErrors.FAILED_TO_END_SPAN,
+            traceback.format_exc() if MISTRAL_SDK_DEBUG_TRACING else DEBUG_HINT,
+        )
+
+class TracedResponse(httpx.Response):
+    """
+    TracedResponse is a subclass of httpx.Response that ends the span when the response is closed.
+
+    This hack allows ending the span only once the stream is fully consumed.
+    """
+    def __init__(self, *args, span: Optional[Span], **kwargs) -> None:
+        super().__init__(*args, **kwargs)
+        self.span = span
+
+    def close(self) -> None:
+        if self.span:
+            end_span(span=self.span)
+        super().close()
+
+    async def aclose(self) -> None:
+        if self.span:
+            end_span(span=self.span)
+        await super().aclose()
+
+    @classmethod
+    def from_response(cls, resp: httpx.Response, span: Optional[Span]) -> "TracedResponse":
+        traced_resp = cls.__new__(cls)
+        traced_resp.__dict__ = copy.copy(resp.__dict__)
+        traced_resp.span = span
+
+        # Warning: this syntax bypasses the __init__ method.
+        # If you add init logic in the TracedResponse.__init__ method, you will need to add the following line for it to execute:
+        # traced_resp.__init__(your_arguments)
+
+        return traced_resp
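As the docstring of `get_or_create_otel_tracer` spells out, the SDK reuses an application-configured tracer provider when one exists, builds its own OTLP export pipeline when only `OTEL_EXPORTER_OTLP_ENDPOINT` is set, and disables tracing otherwise. A standalone-mode sketch (the endpoint and tuning values are illustrative; since the module reads these variables at import time, they must be set before the SDK is imported):

import os

# Standalone mode: no tracer provider configured by the host application.
os.environ["OTEL_EXPORTER_OTLP_ENDPOINT"] = "http://localhost:4318/v1/traces"
os.environ["OTEL_EXPORTER_OTLP_SCHEDULE_DELAY_MILLIS"] = "1000"
os.environ["MISTRAL_SDK_DEBUG_TRACING"] = "true"  # log full export tracebacks

from mistralai import Mistral  # import after the env vars are in place

client = Mistral(api_key=os.environ["MISTRAL_API_KEY"])
# Each request now gets a span named after its operation id, the trace
# context is injected into the request headers, and QuietOTLPSpanExporter
# ships batches to the endpoint above.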
mistralai/extra/run/tools.py
CHANGED
@@ -8,6 +8,7 @@ from pydantic.fields import FieldInfo
 import json
 from typing import cast, Callable, Sequence, Any, ForwardRef, get_type_hints, Union
 
+from opentelemetry import trace
 from griffe import (
     Docstring,
     DocstringSectionKind,
@@ -15,9 +16,11 @@ from griffe import (
     DocstringParameter,
     DocstringSection,
 )
+import opentelemetry.semconv._incubating.attributes.gen_ai_attributes as gen_ai_attributes
 
 from mistralai.extra.exceptions import RunException
 from mistralai.extra.mcp.base import MCPClientProtocol
+from mistralai.extra.observability.otel import GenAISpanEnum, MistralAIAttributes, set_available_attributes
 from mistralai.extra.run.result import RunOutputEntries
 from mistralai.models import (
     FunctionResultEntry,
@@ -191,22 +194,31 @@ async def create_function_result(
         if isinstance(function_call.arguments, str)
         else function_call.arguments
     )
-[16 removed lines: the previous, untraced tool-execution body; content not captured in this view]
+    tracer = trace.get_tracer(__name__)
+    with tracer.start_as_current_span(GenAISpanEnum.function_call(function_call.name)) as span:
+        try:
+            if isinstance(run_tool, RunFunction):
+                res = run_tool.callable(**arguments)
+            elif isinstance(run_tool, RunCoroutine):
+                res = await run_tool.awaitable(**arguments)
+            elif isinstance(run_tool, RunMCPTool):
+                res = await run_tool.mcp_client.execute_tool(function_call.name, arguments)
+            function_call_attributes = {
+                gen_ai_attributes.GEN_AI_OPERATION_NAME: gen_ai_attributes.GenAiOperationNameValues.EXECUTE_TOOL.value,
+                gen_ai_attributes.GEN_AI_TOOL_CALL_ID: function_call.id,
+                MistralAIAttributes.MISTRAL_AI_TOOL_CALL_ARGUMENTS: str(function_call.arguments),
+                gen_ai_attributes.GEN_AI_TOOL_NAME: function_call.name
+            }
+            set_available_attributes(span, function_call_attributes)
+        except Exception as e:
+            if continue_on_fn_error is True:
+                return FunctionResultEntry(
+                    tool_call_id=function_call.tool_call_id,
+                    result=f"Error while executing {function_call.name}: {str(e)}",
+                )
+            raise RunException(
+                f"Failed to execute tool {function_call.name} with arguments '{function_call.arguments}'"
+            ) from e
 
     return FunctionResultEntry(
         tool_call_id=function_call.tool_call_id,