openlit 1.34.30__py3-none-any.whl → 1.34.32__py3-none-any.whl

This diff shows the changes between two publicly released versions of the package, as they appear in the public registry they were published to. It is provided for informational purposes only.
Files changed (168)
  1. openlit/__helpers.py +235 -86
  2. openlit/__init__.py +19 -14
  3. openlit/_instrumentors.py +2 -1
  4. openlit/evals/all.py +50 -21
  5. openlit/evals/bias_detection.py +47 -20
  6. openlit/evals/hallucination.py +53 -22
  7. openlit/evals/toxicity.py +50 -21
  8. openlit/evals/utils.py +54 -30
  9. openlit/guard/all.py +61 -19
  10. openlit/guard/prompt_injection.py +34 -14
  11. openlit/guard/restrict_topic.py +46 -15
  12. openlit/guard/sensitive_topic.py +34 -14
  13. openlit/guard/utils.py +58 -22
  14. openlit/instrumentation/ag2/__init__.py +113 -6
  15. openlit/instrumentation/ag2/ag2.py +459 -17
  16. openlit/instrumentation/ag2/async_ag2.py +459 -17
  17. openlit/instrumentation/ag2/utils.py +475 -31
  18. openlit/instrumentation/ai21/__init__.py +43 -14
  19. openlit/instrumentation/ai21/ai21.py +47 -21
  20. openlit/instrumentation/ai21/async_ai21.py +47 -21
  21. openlit/instrumentation/ai21/utils.py +299 -78
  22. openlit/instrumentation/anthropic/__init__.py +21 -4
  23. openlit/instrumentation/anthropic/anthropic.py +28 -17
  24. openlit/instrumentation/anthropic/async_anthropic.py +28 -17
  25. openlit/instrumentation/anthropic/utils.py +145 -35
  26. openlit/instrumentation/assemblyai/__init__.py +11 -2
  27. openlit/instrumentation/assemblyai/assemblyai.py +15 -4
  28. openlit/instrumentation/assemblyai/utils.py +120 -25
  29. openlit/instrumentation/astra/__init__.py +43 -10
  30. openlit/instrumentation/astra/astra.py +28 -5
  31. openlit/instrumentation/astra/async_astra.py +28 -5
  32. openlit/instrumentation/astra/utils.py +151 -55
  33. openlit/instrumentation/azure_ai_inference/__init__.py +43 -10
  34. openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +53 -21
  35. openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +53 -21
  36. openlit/instrumentation/azure_ai_inference/utils.py +307 -83
  37. openlit/instrumentation/bedrock/__init__.py +21 -4
  38. openlit/instrumentation/bedrock/bedrock.py +63 -25
  39. openlit/instrumentation/bedrock/utils.py +139 -30
  40. openlit/instrumentation/chroma/__init__.py +89 -16
  41. openlit/instrumentation/chroma/chroma.py +28 -6
  42. openlit/instrumentation/chroma/utils.py +167 -51
  43. openlit/instrumentation/cohere/__init__.py +63 -18
  44. openlit/instrumentation/cohere/async_cohere.py +63 -24
  45. openlit/instrumentation/cohere/cohere.py +63 -24
  46. openlit/instrumentation/cohere/utils.py +286 -73
  47. openlit/instrumentation/controlflow/__init__.py +35 -9
  48. openlit/instrumentation/controlflow/controlflow.py +66 -33
  49. openlit/instrumentation/crawl4ai/__init__.py +25 -10
  50. openlit/instrumentation/crawl4ai/async_crawl4ai.py +78 -31
  51. openlit/instrumentation/crawl4ai/crawl4ai.py +78 -31
  52. openlit/instrumentation/crewai/__init__.py +40 -15
  53. openlit/instrumentation/crewai/async_crewai.py +32 -7
  54. openlit/instrumentation/crewai/crewai.py +32 -7
  55. openlit/instrumentation/crewai/utils.py +159 -56
  56. openlit/instrumentation/dynamiq/__init__.py +46 -12
  57. openlit/instrumentation/dynamiq/dynamiq.py +74 -33
  58. openlit/instrumentation/elevenlabs/__init__.py +23 -4
  59. openlit/instrumentation/elevenlabs/async_elevenlabs.py +16 -4
  60. openlit/instrumentation/elevenlabs/elevenlabs.py +16 -4
  61. openlit/instrumentation/elevenlabs/utils.py +128 -25
  62. openlit/instrumentation/embedchain/__init__.py +11 -2
  63. openlit/instrumentation/embedchain/embedchain.py +68 -35
  64. openlit/instrumentation/firecrawl/__init__.py +24 -7
  65. openlit/instrumentation/firecrawl/firecrawl.py +46 -20
  66. openlit/instrumentation/google_ai_studio/__init__.py +45 -10
  67. openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +67 -44
  68. openlit/instrumentation/google_ai_studio/google_ai_studio.py +67 -44
  69. openlit/instrumentation/google_ai_studio/utils.py +180 -67
  70. openlit/instrumentation/gpt4all/__init__.py +22 -7
  71. openlit/instrumentation/gpt4all/gpt4all.py +67 -29
  72. openlit/instrumentation/gpt4all/utils.py +285 -61
  73. openlit/instrumentation/gpu/__init__.py +128 -47
  74. openlit/instrumentation/groq/__init__.py +21 -4
  75. openlit/instrumentation/groq/async_groq.py +33 -21
  76. openlit/instrumentation/groq/groq.py +33 -21
  77. openlit/instrumentation/groq/utils.py +192 -55
  78. openlit/instrumentation/haystack/__init__.py +70 -24
  79. openlit/instrumentation/haystack/async_haystack.py +28 -6
  80. openlit/instrumentation/haystack/haystack.py +28 -6
  81. openlit/instrumentation/haystack/utils.py +196 -74
  82. openlit/instrumentation/julep/__init__.py +69 -19
  83. openlit/instrumentation/julep/async_julep.py +53 -27
  84. openlit/instrumentation/julep/julep.py +53 -28
  85. openlit/instrumentation/langchain/__init__.py +74 -63
  86. openlit/instrumentation/langchain/callback_handler.py +1100 -0
  87. openlit/instrumentation/langchain_community/__init__.py +13 -2
  88. openlit/instrumentation/langchain_community/async_langchain_community.py +23 -5
  89. openlit/instrumentation/langchain_community/langchain_community.py +23 -5
  90. openlit/instrumentation/langchain_community/utils.py +35 -9
  91. openlit/instrumentation/letta/__init__.py +68 -15
  92. openlit/instrumentation/letta/letta.py +99 -54
  93. openlit/instrumentation/litellm/__init__.py +43 -14
  94. openlit/instrumentation/litellm/async_litellm.py +51 -26
  95. openlit/instrumentation/litellm/litellm.py +51 -26
  96. openlit/instrumentation/litellm/utils.py +304 -102
  97. openlit/instrumentation/llamaindex/__init__.py +267 -90
  98. openlit/instrumentation/llamaindex/async_llamaindex.py +28 -6
  99. openlit/instrumentation/llamaindex/llamaindex.py +28 -6
  100. openlit/instrumentation/llamaindex/utils.py +204 -91
  101. openlit/instrumentation/mem0/__init__.py +11 -2
  102. openlit/instrumentation/mem0/mem0.py +50 -29
  103. openlit/instrumentation/milvus/__init__.py +10 -2
  104. openlit/instrumentation/milvus/milvus.py +31 -6
  105. openlit/instrumentation/milvus/utils.py +166 -67
  106. openlit/instrumentation/mistral/__init__.py +63 -18
  107. openlit/instrumentation/mistral/async_mistral.py +63 -24
  108. openlit/instrumentation/mistral/mistral.py +63 -24
  109. openlit/instrumentation/mistral/utils.py +277 -69
  110. openlit/instrumentation/multion/__init__.py +69 -19
  111. openlit/instrumentation/multion/async_multion.py +57 -26
  112. openlit/instrumentation/multion/multion.py +57 -26
  113. openlit/instrumentation/ollama/__init__.py +39 -18
  114. openlit/instrumentation/ollama/async_ollama.py +57 -26
  115. openlit/instrumentation/ollama/ollama.py +57 -26
  116. openlit/instrumentation/ollama/utils.py +226 -50
  117. openlit/instrumentation/openai/__init__.py +156 -32
  118. openlit/instrumentation/openai/async_openai.py +147 -67
  119. openlit/instrumentation/openai/openai.py +150 -67
  120. openlit/instrumentation/openai/utils.py +657 -185
  121. openlit/instrumentation/openai_agents/__init__.py +5 -1
  122. openlit/instrumentation/openai_agents/processor.py +110 -90
  123. openlit/instrumentation/phidata/__init__.py +13 -5
  124. openlit/instrumentation/phidata/phidata.py +67 -32
  125. openlit/instrumentation/pinecone/__init__.py +48 -9
  126. openlit/instrumentation/pinecone/async_pinecone.py +27 -5
  127. openlit/instrumentation/pinecone/pinecone.py +27 -5
  128. openlit/instrumentation/pinecone/utils.py +153 -47
  129. openlit/instrumentation/premai/__init__.py +22 -7
  130. openlit/instrumentation/premai/premai.py +51 -26
  131. openlit/instrumentation/premai/utils.py +246 -59
  132. openlit/instrumentation/pydantic_ai/__init__.py +49 -22
  133. openlit/instrumentation/pydantic_ai/pydantic_ai.py +69 -16
  134. openlit/instrumentation/pydantic_ai/utils.py +89 -24
  135. openlit/instrumentation/qdrant/__init__.py +19 -4
  136. openlit/instrumentation/qdrant/async_qdrant.py +33 -7
  137. openlit/instrumentation/qdrant/qdrant.py +33 -7
  138. openlit/instrumentation/qdrant/utils.py +228 -93
  139. openlit/instrumentation/reka/__init__.py +23 -10
  140. openlit/instrumentation/reka/async_reka.py +17 -11
  141. openlit/instrumentation/reka/reka.py +17 -11
  142. openlit/instrumentation/reka/utils.py +138 -36
  143. openlit/instrumentation/together/__init__.py +44 -12
  144. openlit/instrumentation/together/async_together.py +50 -27
  145. openlit/instrumentation/together/together.py +50 -27
  146. openlit/instrumentation/together/utils.py +301 -71
  147. openlit/instrumentation/transformers/__init__.py +2 -1
  148. openlit/instrumentation/transformers/transformers.py +13 -3
  149. openlit/instrumentation/transformers/utils.py +139 -36
  150. openlit/instrumentation/vertexai/__init__.py +81 -16
  151. openlit/instrumentation/vertexai/async_vertexai.py +33 -15
  152. openlit/instrumentation/vertexai/utils.py +123 -27
  153. openlit/instrumentation/vertexai/vertexai.py +33 -15
  154. openlit/instrumentation/vllm/__init__.py +12 -5
  155. openlit/instrumentation/vllm/utils.py +121 -31
  156. openlit/instrumentation/vllm/vllm.py +16 -10
  157. openlit/otel/events.py +35 -10
  158. openlit/otel/metrics.py +32 -24
  159. openlit/otel/tracing.py +24 -9
  160. openlit/semcov/__init__.py +82 -6
  161. {openlit-1.34.30.dist-info → openlit-1.34.32.dist-info}/METADATA +2 -1
  162. openlit-1.34.32.dist-info/RECORD +166 -0
  163. openlit/instrumentation/langchain/async_langchain.py +0 -102
  164. openlit/instrumentation/langchain/langchain.py +0 -102
  165. openlit/instrumentation/langchain/utils.py +0 -252
  166. openlit-1.34.30.dist-info/RECORD +0 -168
  167. {openlit-1.34.30.dist-info → openlit-1.34.32.dist-info}/LICENSE +0 -0
  168. {openlit-1.34.30.dist-info → openlit-1.34.32.dist-info}/WHEEL +0 -0
openlit/instrumentation/azure_ai_inference/utils.py

@@ -1,6 +1,7 @@
 """
 Azure AI Inference OpenTelemetry instrumentation utility functions
 """
+
 import time
 
 from opentelemetry.trace import Status, StatusCode
@@ -17,6 +18,7 @@ from openlit.__helpers import (
 )
 from openlit.semcov import SemanticConvention
 
+
 def format_content(messages):
     """
     Process a list of messages to extract content.
@@ -29,15 +31,17 @@ def format_content(messages):
 
         if isinstance(content, list):
             content_str = ", ".join(
-                f'{item["type"]}: {item["text"] if "text" in item else item.get("image_url", "")}'
-                if "type" in item else f'text: {item.get("text", "")}'
+                f"{item['type']}: {item['text'] if 'text' in item else item.get('image_url', '')}"
+                if "type" in item
+                else f"text: {item.get('text', '')}"
                 for item in content
             )
-            formatted_messages.append(f'{role}: {content_str}')
+            formatted_messages.append(f"{role}: {content_str}")
         else:
-            formatted_messages.append(f'{role}: {content}')
+            formatted_messages.append(f"{role}: {content}")
+
+    return "\n".join(formatted_messages)
 
-    return '\n'.join(formatted_messages)
 
 def process_chunk(scope, chunk):
     """
@@ -92,25 +96,44 @@ def process_chunk(scope, chunk):
                 func = tool.get("function", {})
                 scope._tools[idx] = {
                     "id": tool["id"],
-                    "function": {"name": func.get("name", ""), "arguments": func.get("arguments", "")},
-                    "type": tool.get("type", "function")
+                    "function": {
+                        "name": func.get("name", ""),
+                        "arguments": func.get("arguments", ""),
+                    },
+                    "type": tool.get("type", "function"),
                 }
-            elif scope._tools[idx] and "function" in tool:  # Append args (id is None)
-                scope._tools[idx]["function"]["arguments"] += tool["function"].get("arguments", "")
+            elif (
+                scope._tools[idx] and "function" in tool
+            ):  # Append args (id is None)
+                scope._tools[idx]["function"]["arguments"] += tool["function"].get(
+                    "arguments", ""
+                )
 
     # Handle usage information (typically only in final chunk)
     if chunked.get("usage"):
         scope._input_tokens = chunked.get("usage").get("prompt_tokens", 0)
         scope._output_tokens = chunked.get("usage").get("completion_tokens", 0)
         # Handle reasoning tokens if present (optional) - check nested structure
-        completion_details = chunked.get("usage", {}).get("completion_tokens_details", {})
+        completion_details = chunked.get("usage", {}).get(
+            "completion_tokens_details", {}
+        )
         if "reasoning_tokens" in completion_details:
             scope._reasoning_tokens = completion_details.get("reasoning_tokens", 0)
         elif "reasoning_tokens" in chunked.get("usage", {}):
             scope._reasoning_tokens = chunked.get("usage").get("reasoning_tokens", 0)
 
-def common_chat_logic(scope, pricing_info, environment, application_name, metrics,
-    capture_message_content, disable_metrics, version, is_stream):
+
+def common_chat_logic(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content,
+    disable_metrics,
+    version,
+    is_stream,
+):
     """
     Process chat request and generate Telemetry
     """
@@ -121,65 +144,134 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
     prompt = format_content(scope._kwargs.get("messages", []))
     request_model = scope._kwargs.get("model", "gpt-4o")
 
-    cost = get_chat_model_cost(request_model, pricing_info, scope._input_tokens, scope._output_tokens)
+    cost = get_chat_model_cost(
+        request_model, pricing_info, scope._input_tokens, scope._output_tokens
+    )
 
     # Common Span Attributes
-    common_span_attributes(scope,
-        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_AZURE_AI_INFERENCE,
-        scope._server_address, scope._server_port, request_model, scope._response_model,
-        environment, application_name, is_stream, scope._tbt, scope._ttft, version)
+    common_span_attributes(
+        scope,
+        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+        SemanticConvention.GEN_AI_SYSTEM_AZURE_AI_INFERENCE,
+        scope._server_address,
+        scope._server_port,
+        request_model,
+        scope._response_model,
+        environment,
+        application_name,
+        is_stream,
+        scope._tbt,
+        scope._ttft,
+        version,
+    )
 
     # Span Attributes for Request parameters
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY, scope._kwargs.get("frequency_penalty", 0.0))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, scope._kwargs.get("max_tokens", -1))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY, scope._kwargs.get("presence_penalty", 0.0))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, scope._kwargs.get("stop", []))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, scope._kwargs.get("temperature", 1.0))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_P, scope._kwargs.get("top_p", 1.0))
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY,
+        scope._kwargs.get("frequency_penalty", 0.0),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS,
+        scope._kwargs.get("max_tokens", -1),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY,
+        scope._kwargs.get("presence_penalty", 0.0),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, scope._kwargs.get("stop", [])
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_TEMPERATURE,
+        scope._kwargs.get("temperature", 1.0),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_TOP_P, scope._kwargs.get("top_p", 1.0)
+    )
 
     # Span Attributes for Response parameters
     scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_ID, scope._response_id)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON, [scope._finish_reason])
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_SERVICE_TIER, scope._response_service_tier)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_SYSTEM_FINGERPRINT, scope._response_service_tier)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE, "text" if isinstance(scope._llmresponse, str) else "json")
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON, [scope._finish_reason]
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RESPONSE_SERVICE_TIER, scope._response_service_tier
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RESPONSE_SYSTEM_FINGERPRINT,
+        scope._response_service_tier,
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_OUTPUT_TYPE,
+        "text" if isinstance(scope._llmresponse, str) else "json",
+    )
 
     # Span Attributes for Cost and Tokens
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, scope._input_tokens + scope._output_tokens)
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE,
+        scope._input_tokens + scope._output_tokens,
+    )
     scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
 
     # Span Attributes for Reasoning (if present)
     if hasattr(scope, "_reasoning_tokens") and scope._reasoning_tokens > 0:
-        scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_REASONING_TOKENS, scope._reasoning_tokens)
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_USAGE_REASONING_TOKENS, scope._reasoning_tokens
+        )
         # Update total token usage to include reasoning tokens
-        scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE,
-            scope._input_tokens + scope._output_tokens + scope._reasoning_tokens)
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE,
+            scope._input_tokens + scope._output_tokens + scope._reasoning_tokens,
+        )
 
     # Span Attributes for Tools - optimized
     if scope._tools:
         tools = scope._tools if isinstance(scope._tools, list) else [scope._tools]
 
-        names, ids, args = zip(*[
-            (t.get("function", {}).get("name", ""),
-            str(t.get("id", "")),
-            str(t.get("function", {}).get("arguments", "")))
-            for t in tools if isinstance(t, dict) and t
-        ]) if tools else ([], [], [])
+        names, ids, args = (
+            zip(
+                *[
+                    (
+                        t.get("function", {}).get("name", ""),
+                        str(t.get("id", "")),
+                        str(t.get("function", {}).get("arguments", "")),
+                    )
+                    for t in tools
+                    if isinstance(t, dict) and t
+                ]
+            )
+            if tools
+            else ([], [], [])
+        )
 
-        scope._span.set_attribute(SemanticConvention.GEN_AI_TOOL_NAME, ", ".join(filter(None, names)))
-        scope._span.set_attribute(SemanticConvention.GEN_AI_TOOL_CALL_ID, ", ".join(filter(None, ids)))
-        scope._span.set_attribute(SemanticConvention.GEN_AI_TOOL_ARGS, ", ".join(filter(None, args)))
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_NAME, ", ".join(filter(None, names))
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_CALL_ID, ", ".join(filter(None, ids))
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_ARGS, ", ".join(filter(None, args))
+        )
 
     # Span Attributes for Content
     if capture_message_content:
         scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_PROMPT, prompt)
-        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse)
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse
+        )
 
         # Add reasoning content if available
         if hasattr(scope, "_reasoning_content") and scope._reasoning_content:
-            scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_REASONING, scope._reasoning_content)
+            scope._span.set_attribute(
+                SemanticConvention.GEN_AI_CONTENT_REASONING, scope._reasoning_content
+            )
 
         # To be removed once the change to span_attributes (from span events) is complete
         scope._span.add_event(
@@ -199,23 +291,69 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
 
     # Metrics
     if not disable_metrics:
-        record_completion_metrics(metrics, SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
-            SemanticConvention.GEN_AI_SYSTEM_AZURE_AI_INFERENCE, scope._server_address, scope._server_port,
-            request_model, scope._response_model, environment, application_name, scope._start_time, scope._end_time,
-            scope._input_tokens, scope._output_tokens, cost, scope._tbt, scope._ttft)
+        record_completion_metrics(
+            metrics,
+            SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+            SemanticConvention.GEN_AI_SYSTEM_AZURE_AI_INFERENCE,
+            scope._server_address,
+            scope._server_port,
+            request_model,
+            scope._response_model,
+            environment,
+            application_name,
+            scope._start_time,
+            scope._end_time,
+            scope._input_tokens,
+            scope._output_tokens,
+            cost,
+            scope._tbt,
+            scope._ttft,
+        )
+
 
-def process_streaming_chat_response(scope, pricing_info, environment, application_name, metrics,
-    capture_message_content=False, disable_metrics=False, version=""):
+def process_streaming_chat_response(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="",
+):
     """
     Process streaming chat request and generate Telemetry
     """
 
-    common_chat_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version, is_stream=True)
+    common_chat_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+        is_stream=True,
+    )
+
 
-def process_chat_response(response, request_model, pricing_info, server_port, server_address,
-    environment, application_name, metrics, start_time, span, capture_message_content=False,
-    disable_metrics=False, version="1.0.0", **kwargs):
+def process_chat_response(
+    response,
+    request_model,
+    pricing_info,
+    server_port,
+    server_address,
+    environment,
+    application_name,
+    metrics,
+    start_time,
+    span,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="1.0.0",
+    **kwargs,
+):
     """
     Process chat request and generate Telemetry
     """
@@ -232,14 +370,20 @@ def process_chat_response(response, request_model, pricing_info, server_port, se
         for choice in response_dict.get("choices", [])
     )
     # Handle reasoning content from non-streaming response
-    reasoning_content = response_dict.get("choices", [{}])[0].get("message", {}).get("reasoning_content")
+    reasoning_content = (
+        response_dict.get("choices", [{}])[0]
+        .get("message", {})
+        .get("reasoning_content")
+    )
     if reasoning_content:
         scope._reasoning_content = reasoning_content
 
     scope._input_tokens = response_dict.get("usage", {}).get("prompt_tokens", 0)
     scope._output_tokens = response_dict.get("usage", {}).get("completion_tokens", 0)
     # Handle reasoning tokens if present (optional) - check nested structure
-    completion_details = response_dict.get("usage", {}).get("completion_tokens_details", {})
+    completion_details = response_dict.get("usage", {}).get(
+        "completion_tokens_details", {}
+    )
     if "reasoning_tokens" in completion_details:
         scope._reasoning_tokens = completion_details.get("reasoning_tokens", 0)
     elif "reasoning_tokens" in response_dict.get("usage", {}):
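The two reasoning_tokens lookups above cover both usage shapes providers emit: nested under completion_tokens_details or flat on the usage object. Illustrative payloads (values made up):

# Nested shape, checked first:
usage_nested = {
    "prompt_tokens": 12,
    "completion_tokens": 40,
    "completion_tokens_details": {"reasoning_tokens": 25},
}
# Flat shape, the elif fallback:
usage_flat = {"prompt_tokens": 12, "completion_tokens": 40, "reasoning_tokens": 25}

assert "reasoning_tokens" in usage_nested.get("completion_tokens_details", {})
assert "reasoning_tokens" in usage_flat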
@@ -248,7 +392,9 @@ def process_chat_response(response, request_model, pricing_info, server_port, se
         scope._reasoning_tokens = 0
     scope._response_id = response_dict.get("id")
     scope._response_model = response_dict.get("model")
-    scope._finish_reason = str(response_dict.get("choices", [])[0].get("finish_reason", ""))
+    scope._finish_reason = str(
+        response_dict.get("choices", [])[0].get("finish_reason", "")
+    )
     scope._response_service_tier = str(response_dict.get("system_fingerprint", ""))
     scope._timestamps = []
     scope._ttft, scope._tbt = scope._end_time - scope._start_time, 0
@@ -257,17 +403,37 @@ def process_chat_response(response, request_model, pricing_info, server_port, se
 
     # Handle tool calls
     if scope._kwargs.get("tools"):
-        scope._tools = response_dict.get("choices", [{}])[0].get("message", {}).get("tool_calls")
+        scope._tools = (
+            response_dict.get("choices", [{}])[0].get("message", {}).get("tool_calls")
+        )
     else:
         scope._tools = None
 
-    common_chat_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version, is_stream=False)
+    common_chat_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+        is_stream=False,
+    )
 
     return response
 
-def common_embedding_logic(scope, pricing_info, environment, application_name, metrics,
-    capture_message_content, disable_metrics, version):
+
+def common_embedding_logic(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content,
+    disable_metrics,
+    version,
+):
     """
     Process embedding request and generate Telemetry
     """
@@ -277,29 +443,54 @@ def common_embedding_logic(scope, pricing_info, environment, application_name, m
     cost = get_embed_model_cost(request_model, pricing_info, scope._input_tokens)
 
     # Common Span Attributes
-    common_span_attributes(scope,
-        SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING, SemanticConvention.GEN_AI_SYSTEM_AZURE_AI_INFERENCE,
-        scope._server_address, scope._server_port, request_model, scope._response_model,
-        environment, application_name, False, 0, scope._end_time - scope._start_time, version)
+    common_span_attributes(
+        scope,
+        SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING,
+        SemanticConvention.GEN_AI_SYSTEM_AZURE_AI_INFERENCE,
+        scope._server_address,
+        scope._server_port,
+        request_model,
+        scope._response_model,
+        environment,
+        application_name,
+        False,
+        0,
+        scope._end_time - scope._start_time,
+        version,
+    )
 
     # Span Attributes for Request parameters
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_ENCODING_FORMATS, [scope._kwargs.get("encoding_format", "float")])
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_USER, scope._kwargs.get("user", ""))
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_ENCODING_FORMATS,
+        [scope._kwargs.get("encoding_format", "float")],
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_USER, scope._kwargs.get("user", "")
+    )
 
     # Span Attributes for Cost and Tokens
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, scope._input_tokens)
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, scope._input_tokens
+    )
     scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
 
     # Span Attributes for Content
     if capture_message_content:
-        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_PROMPT, str(scope._kwargs.get("input", "")))
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_CONTENT_PROMPT,
+            str(scope._kwargs.get("input", "")),
+        )
 
         # To be removed once the change to span_attributes (from span events) is complete
         scope._span.add_event(
             name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
             attributes={
-                SemanticConvention.GEN_AI_CONTENT_PROMPT: str(scope._kwargs.get("input", "")),
+                SemanticConvention.GEN_AI_CONTENT_PROMPT: str(
+                    scope._kwargs.get("input", "")
+                ),
             },
         )
 
@@ -307,14 +498,39 @@ def common_embedding_logic(scope, pricing_info, environment, application_name, m
 
     # Metrics
     if not disable_metrics:
-        record_embedding_metrics(metrics, SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING,
-            SemanticConvention.GEN_AI_SYSTEM_AZURE_AI_INFERENCE, scope._server_address, scope._server_port,
-            request_model, scope._response_model, environment, application_name, scope._start_time, scope._end_time,
-            scope._input_tokens, cost)
-
-def process_embedding_response(response, request_model, pricing_info, server_port, server_address,
-    environment, application_name, metrics, start_time, span, capture_message_content=False,
-    disable_metrics=False, version="1.0.0", **kwargs):
+        record_embedding_metrics(
+            metrics,
+            SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING,
+            SemanticConvention.GEN_AI_SYSTEM_AZURE_AI_INFERENCE,
+            scope._server_address,
+            scope._server_port,
+            request_model,
+            scope._response_model,
+            environment,
+            application_name,
+            scope._start_time,
+            scope._end_time,
+            scope._input_tokens,
+            cost,
+        )
+
+
+def process_embedding_response(
+    response,
+    request_model,
+    pricing_info,
+    server_port,
+    server_address,
+    environment,
+    application_name,
+    metrics,
+    start_time,
+    span,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="1.0.0",
+    **kwargs,
+):
     """
     Process embedding request and generate Telemetry
     """
@@ -331,7 +547,15 @@ def process_embedding_response(response, request_model, pricing_info, server_por
     scope._server_address, scope._server_port = server_address, server_port
     scope._kwargs = kwargs
 
-    common_embedding_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version)
+    common_embedding_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+    )
 
     return response
openlit/instrumentation/bedrock/__init__.py

@@ -9,6 +9,7 @@ from openlit.instrumentation.bedrock.bedrock import converse, converse_stream
 
 _instruments = ("boto3 >= 1.34.138",)
 
+
 class BedrockInstrumentor(BaseInstrumentor):
     """
     An instrumentor for AWS Bedrock client library.
@@ -31,16 +32,32 @@ class BedrockInstrumentor(BaseInstrumentor):
         wrap_function_wrapper(
             "botocore.client",
             "ClientCreator.create_client",
-            converse(version, environment, application_name, tracer, pricing_info,
-                capture_message_content, metrics, disable_metrics),
+            converse(
+                version,
+                environment,
+                application_name,
+                tracer,
+                pricing_info,
+                capture_message_content,
+                metrics,
+                disable_metrics,
+            ),
         )
 
         # streaming
         wrap_function_wrapper(
             "botocore.client",
             "ClientCreator.create_client",
-            converse_stream(version, environment, application_name, tracer, pricing_info,
-                capture_message_content, metrics, disable_metrics),
+            converse_stream(
+                version,
+                environment,
+                application_name,
+                tracer,
+                pricing_info,
+                capture_message_content,
+                metrics,
+                disable_metrics,
+            ),
         )
 
     def _uninstrument(self, **kwargs):
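Both wrappers above are registered through wrapt's wrap_function_wrapper(module, name, wrapper), which patches the target attribute in place. A minimal sketch of that mechanism; my_module.do_work is a hypothetical stand-in for botocore.client's ClientCreator.create_client, and make_wrapper mirrors how the converse() factory closes over its configuration:

import sys
import types

from wrapt import wrap_function_wrapper

# Hypothetical target module, built inline so the sketch is self-contained.
my_module = types.ModuleType("my_module")
my_module.do_work = lambda x: x * 2
sys.modules["my_module"] = my_module

def make_wrapper(version):
    # The factory closes over configuration, like converse(version, ...) above.
    def wrapper(wrapped, instance, args, kwargs):
        # Real instrumentation records telemetry around this call.
        print(f"instrumented (v{version}): args={args}")
        return wrapped(*args, **kwargs)
    return wrapper

wrap_function_wrapper("my_module", "do_work", make_wrapper("1.34.32"))

print(my_module.do_work(21))  # prints the instrumented line, then 42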