openlit 1.34.30__py3-none-any.whl → 1.34.31__py3-none-any.whl
This diff compares the contents of two publicly released versions of the package as published to a supported registry. It is provided for informational purposes only and reflects the changes between the versions as they appear in the public registry.
- openlit/__helpers.py +235 -86
- openlit/__init__.py +16 -13
- openlit/_instrumentors.py +2 -1
- openlit/evals/all.py +50 -21
- openlit/evals/bias_detection.py +47 -20
- openlit/evals/hallucination.py +53 -22
- openlit/evals/toxicity.py +50 -21
- openlit/evals/utils.py +54 -30
- openlit/guard/all.py +61 -19
- openlit/guard/prompt_injection.py +34 -14
- openlit/guard/restrict_topic.py +46 -15
- openlit/guard/sensitive_topic.py +34 -14
- openlit/guard/utils.py +58 -22
- openlit/instrumentation/ag2/__init__.py +24 -8
- openlit/instrumentation/ag2/ag2.py +34 -13
- openlit/instrumentation/ag2/async_ag2.py +34 -13
- openlit/instrumentation/ag2/utils.py +133 -30
- openlit/instrumentation/ai21/__init__.py +43 -14
- openlit/instrumentation/ai21/ai21.py +47 -21
- openlit/instrumentation/ai21/async_ai21.py +47 -21
- openlit/instrumentation/ai21/utils.py +299 -78
- openlit/instrumentation/anthropic/__init__.py +21 -4
- openlit/instrumentation/anthropic/anthropic.py +28 -17
- openlit/instrumentation/anthropic/async_anthropic.py +28 -17
- openlit/instrumentation/anthropic/utils.py +145 -35
- openlit/instrumentation/assemblyai/__init__.py +11 -2
- openlit/instrumentation/assemblyai/assemblyai.py +15 -4
- openlit/instrumentation/assemblyai/utils.py +120 -25
- openlit/instrumentation/astra/__init__.py +43 -10
- openlit/instrumentation/astra/astra.py +28 -5
- openlit/instrumentation/astra/async_astra.py +28 -5
- openlit/instrumentation/astra/utils.py +151 -55
- openlit/instrumentation/azure_ai_inference/__init__.py +43 -10
- openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +53 -21
- openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +53 -21
- openlit/instrumentation/azure_ai_inference/utils.py +307 -83
- openlit/instrumentation/bedrock/__init__.py +21 -4
- openlit/instrumentation/bedrock/bedrock.py +63 -25
- openlit/instrumentation/bedrock/utils.py +139 -30
- openlit/instrumentation/chroma/__init__.py +89 -16
- openlit/instrumentation/chroma/chroma.py +28 -6
- openlit/instrumentation/chroma/utils.py +167 -51
- openlit/instrumentation/cohere/__init__.py +63 -18
- openlit/instrumentation/cohere/async_cohere.py +63 -24
- openlit/instrumentation/cohere/cohere.py +63 -24
- openlit/instrumentation/cohere/utils.py +286 -73
- openlit/instrumentation/controlflow/__init__.py +35 -9
- openlit/instrumentation/controlflow/controlflow.py +66 -33
- openlit/instrumentation/crawl4ai/__init__.py +25 -10
- openlit/instrumentation/crawl4ai/async_crawl4ai.py +78 -31
- openlit/instrumentation/crawl4ai/crawl4ai.py +78 -31
- openlit/instrumentation/crewai/__init__.py +40 -15
- openlit/instrumentation/crewai/async_crewai.py +32 -7
- openlit/instrumentation/crewai/crewai.py +32 -7
- openlit/instrumentation/crewai/utils.py +159 -56
- openlit/instrumentation/dynamiq/__init__.py +46 -12
- openlit/instrumentation/dynamiq/dynamiq.py +74 -33
- openlit/instrumentation/elevenlabs/__init__.py +23 -4
- openlit/instrumentation/elevenlabs/async_elevenlabs.py +16 -4
- openlit/instrumentation/elevenlabs/elevenlabs.py +16 -4
- openlit/instrumentation/elevenlabs/utils.py +128 -25
- openlit/instrumentation/embedchain/__init__.py +11 -2
- openlit/instrumentation/embedchain/embedchain.py +68 -35
- openlit/instrumentation/firecrawl/__init__.py +24 -7
- openlit/instrumentation/firecrawl/firecrawl.py +46 -20
- openlit/instrumentation/google_ai_studio/__init__.py +45 -10
- openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +67 -44
- openlit/instrumentation/google_ai_studio/google_ai_studio.py +67 -44
- openlit/instrumentation/google_ai_studio/utils.py +180 -67
- openlit/instrumentation/gpt4all/__init__.py +22 -7
- openlit/instrumentation/gpt4all/gpt4all.py +67 -29
- openlit/instrumentation/gpt4all/utils.py +285 -61
- openlit/instrumentation/gpu/__init__.py +128 -47
- openlit/instrumentation/groq/__init__.py +21 -4
- openlit/instrumentation/groq/async_groq.py +33 -21
- openlit/instrumentation/groq/groq.py +33 -21
- openlit/instrumentation/groq/utils.py +192 -55
- openlit/instrumentation/haystack/__init__.py +70 -24
- openlit/instrumentation/haystack/async_haystack.py +28 -6
- openlit/instrumentation/haystack/haystack.py +28 -6
- openlit/instrumentation/haystack/utils.py +196 -74
- openlit/instrumentation/julep/__init__.py +69 -19
- openlit/instrumentation/julep/async_julep.py +53 -27
- openlit/instrumentation/julep/julep.py +53 -28
- openlit/instrumentation/langchain/__init__.py +74 -63
- openlit/instrumentation/langchain/callback_handler.py +1100 -0
- openlit/instrumentation/langchain_community/__init__.py +13 -2
- openlit/instrumentation/langchain_community/async_langchain_community.py +23 -5
- openlit/instrumentation/langchain_community/langchain_community.py +23 -5
- openlit/instrumentation/langchain_community/utils.py +35 -9
- openlit/instrumentation/letta/__init__.py +68 -15
- openlit/instrumentation/letta/letta.py +99 -54
- openlit/instrumentation/litellm/__init__.py +43 -14
- openlit/instrumentation/litellm/async_litellm.py +51 -26
- openlit/instrumentation/litellm/litellm.py +51 -26
- openlit/instrumentation/litellm/utils.py +304 -102
- openlit/instrumentation/llamaindex/__init__.py +267 -90
- openlit/instrumentation/llamaindex/async_llamaindex.py +28 -6
- openlit/instrumentation/llamaindex/llamaindex.py +28 -6
- openlit/instrumentation/llamaindex/utils.py +204 -91
- openlit/instrumentation/mem0/__init__.py +11 -2
- openlit/instrumentation/mem0/mem0.py +50 -29
- openlit/instrumentation/milvus/__init__.py +10 -2
- openlit/instrumentation/milvus/milvus.py +31 -6
- openlit/instrumentation/milvus/utils.py +166 -67
- openlit/instrumentation/mistral/__init__.py +63 -18
- openlit/instrumentation/mistral/async_mistral.py +63 -24
- openlit/instrumentation/mistral/mistral.py +63 -24
- openlit/instrumentation/mistral/utils.py +277 -69
- openlit/instrumentation/multion/__init__.py +69 -19
- openlit/instrumentation/multion/async_multion.py +57 -26
- openlit/instrumentation/multion/multion.py +57 -26
- openlit/instrumentation/ollama/__init__.py +39 -18
- openlit/instrumentation/ollama/async_ollama.py +57 -26
- openlit/instrumentation/ollama/ollama.py +57 -26
- openlit/instrumentation/ollama/utils.py +226 -50
- openlit/instrumentation/openai/__init__.py +156 -32
- openlit/instrumentation/openai/async_openai.py +147 -67
- openlit/instrumentation/openai/openai.py +150 -67
- openlit/instrumentation/openai/utils.py +657 -185
- openlit/instrumentation/openai_agents/__init__.py +5 -1
- openlit/instrumentation/openai_agents/processor.py +110 -90
- openlit/instrumentation/phidata/__init__.py +13 -5
- openlit/instrumentation/phidata/phidata.py +67 -32
- openlit/instrumentation/pinecone/__init__.py +48 -9
- openlit/instrumentation/pinecone/async_pinecone.py +27 -5
- openlit/instrumentation/pinecone/pinecone.py +27 -5
- openlit/instrumentation/pinecone/utils.py +153 -47
- openlit/instrumentation/premai/__init__.py +22 -7
- openlit/instrumentation/premai/premai.py +51 -26
- openlit/instrumentation/premai/utils.py +246 -59
- openlit/instrumentation/pydantic_ai/__init__.py +49 -22
- openlit/instrumentation/pydantic_ai/pydantic_ai.py +69 -16
- openlit/instrumentation/pydantic_ai/utils.py +89 -24
- openlit/instrumentation/qdrant/__init__.py +19 -4
- openlit/instrumentation/qdrant/async_qdrant.py +33 -7
- openlit/instrumentation/qdrant/qdrant.py +33 -7
- openlit/instrumentation/qdrant/utils.py +228 -93
- openlit/instrumentation/reka/__init__.py +23 -10
- openlit/instrumentation/reka/async_reka.py +17 -11
- openlit/instrumentation/reka/reka.py +17 -11
- openlit/instrumentation/reka/utils.py +138 -36
- openlit/instrumentation/together/__init__.py +44 -12
- openlit/instrumentation/together/async_together.py +50 -27
- openlit/instrumentation/together/together.py +50 -27
- openlit/instrumentation/together/utils.py +301 -71
- openlit/instrumentation/transformers/__init__.py +2 -1
- openlit/instrumentation/transformers/transformers.py +13 -3
- openlit/instrumentation/transformers/utils.py +139 -36
- openlit/instrumentation/vertexai/__init__.py +81 -16
- openlit/instrumentation/vertexai/async_vertexai.py +33 -15
- openlit/instrumentation/vertexai/utils.py +123 -27
- openlit/instrumentation/vertexai/vertexai.py +33 -15
- openlit/instrumentation/vllm/__init__.py +12 -5
- openlit/instrumentation/vllm/utils.py +121 -31
- openlit/instrumentation/vllm/vllm.py +16 -10
- openlit/otel/events.py +35 -10
- openlit/otel/metrics.py +32 -24
- openlit/otel/tracing.py +24 -9
- openlit/semcov/__init__.py +72 -6
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/METADATA +2 -1
- openlit-1.34.31.dist-info/RECORD +166 -0
- openlit/instrumentation/langchain/async_langchain.py +0 -102
- openlit/instrumentation/langchain/langchain.py +0 -102
- openlit/instrumentation/langchain/utils.py +0 -252
- openlit-1.34.30.dist-info/RECORD +0 -168
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/LICENSE +0 -0
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/WHEEL +0 -0
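Judging by the file list, the most substantive change is to the LangChain instrumentation, which is rebuilt around a new callback_handler.py (+1100 lines) while langchain.py, async_langchain.py, and utils.py are removed. The remaining files appear to change mostly through mechanical reformatting (re-wrapped calls, trailing commas, blank-line normalization), as the visible hunks below — from the AI21 utils module and the Anthropic instrumentation — illustrate.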
From openlit/instrumentation/ai21/utils.py:

```diff
@@ -17,6 +17,7 @@ from openlit.__helpers import (
 )
 from openlit.semcov import SemanticConvention
 
+
 def format_content(messages):
     """
     Process a list of messages to extract content.
@@ -25,9 +26,15 @@ def format_content(messages):
     formatted_messages = []
     for message in messages:
         # Handle different message formats
-        if hasattr(message, "role") and (hasattr(message, "content") or hasattr(message, "text")):
+        if hasattr(message, "role") and (
+            hasattr(message, "content") or hasattr(message, "text")
+        ):
             # ChatMessage object (AI21 format)
-            role = str(message.role) if hasattr(message.role, "value") else str(message.role)
+            role = (
+                str(message.role)
+                if hasattr(message.role, "value")
+                else str(message.role)
+            )
             content = getattr(message, "content", None) or getattr(message, "text", "")
         elif isinstance(message, dict):
             # Dictionary format
@@ -36,12 +43,15 @@ def format_content(messages):
         else:
             # Fallback - try to extract as string
             role = str(getattr(message, "role", "unknown"))
-            content = str(getattr(message, "content", "") or getattr(message, "text", ""))
+            content = str(
+                getattr(message, "content", "") or getattr(message, "text", "")
+            )
 
         if isinstance(content, list):
             content_str = ", ".join(
-                f"{item['type']}: {item['text'] if 'text' in item else item['image_url']}"
-                if "type" in item else f"text: {item['text']}"
+                f"{item['type']}: {item['text'] if 'text' in item else item['image_url']}"
+                if "type" in item
+                else f"text: {item['text']}"
                 for item in content
             )
             formatted_messages.append(f"{role}: {content_str}")
```
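Taken together, these hunks only re-wrap format_content; its behavior is unchanged. A quick illustration of what it produces, using hypothetical inputs (the dict branch is elided between the hunks, but it extracts role and content the same way):

```python
# Hypothetical inputs showing format_content's flattening; the
# "type"-keyed list branch comes straight from the hunk above.
messages = [
    {"role": "system", "content": "You are concise."},
    {"role": "user", "content": [{"type": "text", "text": "Hello"}]},
]
# Expected result of format_content(messages):
# system: You are concise.
# user: text: Hello
```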
openlit/instrumentation/ai21/utils.py (continued):

```diff
@@ -50,6 +60,7 @@ def format_content(messages):
 
     return "\n".join(formatted_messages)
 
+
 def process_chunk(scope, chunk):
     """
     Process a chunk of response data and update state.
@@ -66,10 +77,11 @@ def process_chunk(scope, chunk):
     chunked = response_as_dict(chunk)
 
     # Collect message IDs and aggregated response from events
-    if (len(chunked.get("choices", [])) > 0 and
-        "delta" in chunked.get("choices")[0] and
-        "content" in chunked.get("choices")[0].get("delta", {})
-    ):
+    if (
+        len(chunked.get("choices", [])) > 0
+        and "delta" in chunked.get("choices")[0]
+        and "content" in chunked.get("choices")[0].get("delta", {})
+    ):
         content = chunked.get("choices")[0].get("delta").get("content")
         if content:
             scope._llmresponse += content
```
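The guard above is the heart of AI21 streaming telemetry: only chunks whose first choice carries a content delta extend the aggregated response. A standalone sketch of the same pattern (names mirror the diff; this is not openlit's public API):

```python
# Minimal sketch of delta accumulation over a stream of chunk dicts.
class Scope:
    def __init__(self):
        self._llmresponse = ""

def accumulate(scope: Scope, chunked: dict) -> None:
    choices = chunked.get("choices", [])
    if choices and "content" in choices[0].get("delta", {}):
        content = choices[0]["delta"]["content"]
        if content:  # skip None/empty deltas
            scope._llmresponse += content

scope = Scope()
for chunk in ({"choices": [{"delta": {"content": "Hel"}}]},
              {"choices": [{"delta": {"content": "lo"}}]}):
    accumulate(scope, chunk)
assert scope._llmresponse == "Hello"
```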
openlit/instrumentation/ai21/utils.py (continued):

```diff
@@ -81,8 +93,18 @@ def process_chunk(scope, chunk):
     scope._finish_reason = chunked.get("choices", [{}])[0].get("finish_reason")
     scope._end_time = time.time()
 
-def common_chat_logic(scope, pricing_info, environment, application_name, metrics,
-    capture_message_content, disable_metrics, version, is_stream):
+
+def common_chat_logic(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content,
+    disable_metrics,
+    version,
+    is_stream,
+):
     """
     Process chat request and generate Telemetry
     """
@@ -93,44 +115,97 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metrics,
     prompt = format_content(scope._kwargs.get("messages", []))
     request_model = scope._kwargs.get("model", "jamba-1.5-mini")
 
-    cost = get_chat_model_cost(request_model, pricing_info, scope._input_tokens, scope._output_tokens)
+    cost = get_chat_model_cost(
+        request_model, pricing_info, scope._input_tokens, scope._output_tokens
+    )
 
     # Common Span Attributes
-    common_span_attributes(scope,
-        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_AI21,
-        scope._server_address, scope._server_port, request_model, request_model,
-        environment, application_name, is_stream, scope._tbt, scope._ttft, version)
+    common_span_attributes(
+        scope,
+        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+        SemanticConvention.GEN_AI_SYSTEM_AI21,
+        scope._server_address,
+        scope._server_port,
+        request_model,
+        request_model,
+        environment,
+        application_name,
+        is_stream,
+        scope._tbt,
+        scope._ttft,
+        version,
+    )
 
     # Span Attributes for Request parameters
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_SEED, scope._kwargs.get("seed", ""))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY, scope._kwargs.get("frequency_penalty", 0.0))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, scope._kwargs.get("max_tokens", -1))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY, scope._kwargs.get("presence_penalty", 0.0))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, scope._kwargs.get("stop", []))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, scope._kwargs.get("temperature", 0.4))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_P, scope._kwargs.get("top_p", 1.0))
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_SEED, scope._kwargs.get("seed", "")
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY,
+        scope._kwargs.get("frequency_penalty", 0.0),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS,
+        scope._kwargs.get("max_tokens", -1),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY,
+        scope._kwargs.get("presence_penalty", 0.0),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, scope._kwargs.get("stop", [])
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_TEMPERATURE,
+        scope._kwargs.get("temperature", 0.4),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_TOP_P, scope._kwargs.get("top_p", 1.0)
+    )
 
     # Span Attributes for Response parameters
     scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_ID, scope._response_id)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON, [scope._finish_reason])
-    scope._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE, "text" if isinstance(scope._llmresponse, str) else "json")
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON, [scope._finish_reason]
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_OUTPUT_TYPE,
+        "text" if isinstance(scope._llmresponse, str) else "json",
+    )
 
     # Span Attributes for Cost and Tokens
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, scope._input_tokens + scope._output_tokens)
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE,
+        scope._input_tokens + scope._output_tokens,
+    )
     scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
 
     # Span Attributes for Tools
     if scope._tools:
-        scope._span.set_attribute(SemanticConvention.GEN_AI_TOOL_NAME, scope._tools.get("function", {}).get("name", ""))
-        scope._span.set_attribute(SemanticConvention.GEN_AI_TOOL_CALL_ID, str(scope._tools.get("id", "")))
-        scope._span.set_attribute(SemanticConvention.GEN_AI_TOOL_ARGS, str(scope._tools.get("function", {}).get("arguments", "")))
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_NAME,
+            scope._tools.get("function", {}).get("name", ""),
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_CALL_ID, str(scope._tools.get("id", ""))
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_ARGS,
+            str(scope._tools.get("function", {}).get("arguments", "")),
+        )
 
     # Span Attributes for Content
     if capture_message_content:
         scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_PROMPT, prompt)
-        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse)
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse
+        )
 
     # To be removed once the change to span_attributes (from span events) is complete
     scope._span.add_event(
```
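Everything in this function funnels into plain span.set_attribute calls. For readers unfamiliar with the pattern, a self-contained OpenTelemetry sketch (literal attribute strings stand in for openlit's SemanticConvention constants):

```python
# Standalone illustration of the span-attribute pattern used above;
# attribute keys are stand-ins for the SemanticConvention constants.
from opentelemetry import trace
from opentelemetry.sdk.trace import TracerProvider

trace.set_tracer_provider(TracerProvider())
tracer = trace.get_tracer("demo")

with tracer.start_as_current_span("chat jamba-1.5-mini") as span:
    span.set_attribute("gen_ai.request.temperature", 0.4)
    span.set_attribute("gen_ai.usage.input_tokens", 128)
    span.set_attribute("gen_ai.usage.output_tokens", 42)
```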
openlit/instrumentation/ai21/utils.py (continued):

```diff
@@ -150,23 +225,69 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metrics,
 
     # Metrics
     if not disable_metrics:
-        record_completion_metrics(metrics,
-            SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_AI21,
-            scope._server_address, scope._server_port, request_model, request_model, environment,
-            application_name, scope._start_time, scope._end_time, scope._input_tokens, scope._output_tokens, cost, scope._tbt, scope._ttft)
+        record_completion_metrics(
+            metrics,
+            SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+            SemanticConvention.GEN_AI_SYSTEM_AI21,
+            scope._server_address,
+            scope._server_port,
+            request_model,
+            request_model,
+            environment,
+            application_name,
+            scope._start_time,
+            scope._end_time,
+            scope._input_tokens,
+            scope._output_tokens,
+            cost,
+            scope._tbt,
+            scope._ttft,
+        )
 
-def process_streaming_chat_response(scope, pricing_info, environment, application_name, metrics,
-    capture_message_content=False, disable_metrics=False, version=""):
+
+def process_streaming_chat_response(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="",
+):
     """
     Process streaming chat request and generate Telemetry
     """
 
-    common_chat_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version, is_stream=True)
+    common_chat_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+        is_stream=True,
+    )
+
 
-def process_chat_response(response, request_model, pricing_info, server_port, server_address,
-    environment, application_name, metrics, start_time, span, capture_message_content=False,
-    disable_metrics=False, version="1.0.0", **kwargs):
+def process_chat_response(
+    response,
+    request_model,
+    pricing_info,
+    server_port,
+    server_address,
+    environment,
+    application_name,
+    metrics,
+    start_time,
+    span,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="1.0.0",
+    **kwargs,
+):
     """
     Process chat request and generate Telemetry
     """
```
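record_completion_metrics ultimately lands on OpenTelemetry instruments. A sketch of that recording pattern with the stock metrics API (instrument and attribute names are illustrative; openlit's actual ones may differ):

```python
# Illustrative metric recording with the OpenTelemetry metrics API.
from opentelemetry import metrics

meter = metrics.get_meter("demo")
token_usage = meter.create_histogram("gen_ai.client.token.usage")

# One completion: 128 prompt tokens + 42 completion tokens.
token_usage.record(
    128 + 42,
    attributes={"gen_ai.operation.name": "chat", "gen_ai.system": "ai21"},
)
```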
openlit/instrumentation/ai21/utils.py (continued):

```diff
@@ -189,21 +310,43 @@ def process_chat_response(response, request_model, pricing_info, server_port, server_address,
     scope._ttft, scope._tbt = scope._end_time - scope._start_time, 0
     scope._server_address, scope._server_port = server_address, server_port
     scope._kwargs = kwargs
-    scope._finish_reason = str(response_dict.get("choices", [])[0].get("finish_reason", ""))
+    scope._finish_reason = str(
+        response_dict.get("choices", [])[0].get("finish_reason", "")
+    )
 
     # Handle tool calls
     if scope._kwargs.get("tools"):
-        scope._tools = response_dict.get("choices", [{}])[0].get("message", {}).get("tool_calls")
+        scope._tools = (
+            response_dict.get("choices", [{}])[0].get("message", {}).get("tool_calls")
+        )
     else:
         scope._tools = None
 
-    common_chat_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version, is_stream=False)
+    common_chat_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+        is_stream=False,
+    )
 
     return response
 
-def common_chat_rag_logic(scope, pricing_info, environment, application_name, metrics,
-    capture_message_content, disable_metrics, version):
+
+def common_chat_rag_logic(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content,
+    disable_metrics,
+    version,
+):
     """
     Process RAG chat request and generate Telemetry
     """
@@ -211,40 +354,82 @@ def common_chat_rag_logic(scope, pricing_info, environment, application_name, metrics,
     prompt = format_content(scope._kwargs.get("messages", []))
     request_model = scope._kwargs.get("model", "jamba-1.5-mini")
 
-    cost = get_chat_model_cost(request_model, pricing_info, scope._input_tokens, scope._output_tokens)
+    cost = get_chat_model_cost(
+        request_model, pricing_info, scope._input_tokens, scope._output_tokens
+    )
 
     # Common Span Attributes
-    common_span_attributes(scope,
-        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_AI21,
-        scope._server_address, scope._server_port, request_model, scope._response_model,
-        environment, application_name, False, scope._tbt, scope._ttft, version)
+    common_span_attributes(
+        scope,
+        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+        SemanticConvention.GEN_AI_SYSTEM_AI21,
+        scope._server_address,
+        scope._server_port,
+        request_model,
+        scope._response_model,
+        environment,
+        application_name,
+        False,
+        scope._tbt,
+        scope._ttft,
+        version,
+    )
 
     # RAG-specific span attributes
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RAG_MAX_SEGMENTS,
-        scope._kwargs.get("max_segments", -1))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RAG_STRATEGY, scope._kwargs.get("retrieval_strategy", "segments"))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RAG_MAX_NEIGHBORS, scope._kwargs.get("max_neighbors", -1))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RAG_FILE_IDS, str(scope._kwargs.get("file_ids", "")))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RAG_DOCUMENTS_PATH, scope._kwargs.get("path", ""))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RAG_SIMILARITY_THRESHOLD, scope._kwargs.get("retrieval_similarity_threshold", -1))
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RAG_MAX_SEGMENTS,
+        scope._kwargs.get("max_segments", -1),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RAG_STRATEGY,
+        scope._kwargs.get("retrieval_strategy", "segments"),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RAG_MAX_NEIGHBORS,
+        scope._kwargs.get("max_neighbors", -1),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RAG_FILE_IDS, str(scope._kwargs.get("file_ids", ""))
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RAG_DOCUMENTS_PATH, scope._kwargs.get("path", "")
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RAG_SIMILARITY_THRESHOLD,
+        scope._kwargs.get("retrieval_similarity_threshold", -1),
+    )
 
     # Standard span attributes
     scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_ID, scope._response_id)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE, "text" if isinstance(scope._llmresponse, str) else "json")
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, scope._input_tokens + scope._output_tokens)
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_OUTPUT_TYPE,
+        "text" if isinstance(scope._llmresponse, str) else "json",
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE,
+        scope._input_tokens + scope._output_tokens,
+    )
     scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
 
     # Handle tool calls
     if scope._kwargs.get("tools"):
-        scope._span.set_attribute(SemanticConvention.GEN_AI_TOOL_CALLS,
-            str(scope._choices[0].get("message", {}).get("tool_calls", "")))
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_CALLS,
+            str(scope._choices[0].get("message", {}).get("tool_calls", "")),
+        )
 
     # Content attributes
     if capture_message_content:
         scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_PROMPT, prompt)
-        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse)
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse
+        )
 
     # To be removed once the change to span_attributes (from span events) is complete
     scope._span.add_event(
```
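Both the plain and RAG paths price the call with get_chat_model_cost before attaching GEN_AI_USAGE_COST. The helper's internals are not part of this diff; a plausible per-1k-token sketch, under the assumption that pricing_info maps model names to prompt/completion rates:

```python
# Hypothetical cost computation; openlit's real pricing_info schema is
# not shown in this diff, so the key names here are assumptions.
def get_chat_model_cost(model, pricing_info, input_tokens, output_tokens):
    rates = pricing_info.get("chat", {}).get(model, {})
    prompt_rate = rates.get("promptPrice", 0.0)          # USD per 1k input tokens
    completion_rate = rates.get("completionPrice", 0.0)  # USD per 1k output tokens
    return (input_tokens / 1000) * prompt_rate + (output_tokens / 1000) * completion_rate

pricing = {"chat": {"jamba-1.5-mini": {"promptPrice": 0.2, "completionPrice": 0.4}}}
assert get_chat_model_cost("jamba-1.5-mini", pricing, 1000, 500) == 0.4
```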
openlit/instrumentation/ai21/utils.py (continued):

```diff
@@ -264,14 +449,42 @@ def common_chat_rag_logic(scope, pricing_info, environment, application_name, metrics,
 
     # Metrics
     if not disable_metrics:
-        record_completion_metrics(metrics,
-            SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_AI21,
-            scope._server_address, scope._server_port, request_model, scope._response_model, environment,
-            application_name, scope._start_time, scope._end_time, scope._input_tokens, scope._output_tokens, cost, scope._tbt, scope._ttft)
-
-def process_chat_rag_response(response, request_model, pricing_info, server_port, server_address,
-    environment, application_name, metrics, start_time, span, capture_message_content=False,
-    disable_metrics=False, version="1.0.0", **kwargs):
+        record_completion_metrics(
+            metrics,
+            SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+            SemanticConvention.GEN_AI_SYSTEM_AI21,
+            scope._server_address,
+            scope._server_port,
+            request_model,
+            scope._response_model,
+            environment,
+            application_name,
+            scope._start_time,
+            scope._end_time,
+            scope._input_tokens,
+            scope._output_tokens,
+            cost,
+            scope._tbt,
+            scope._ttft,
+        )
+
+
+def process_chat_rag_response(
+    response,
+    request_model,
+    pricing_info,
+    server_port,
+    server_address,
+    environment,
+    application_name,
+    metrics,
+    start_time,
+    span,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="1.0.0",
+    **kwargs,
+):
     """
     Process RAG chat request and generate Telemetry
     """
@@ -311,7 +524,15 @@ def process_chat_rag_response(response, request_model, pricing_info, server_port, server_address,
     scope._tools = None
     scope._choices = choices
 
-    common_chat_rag_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version)
+    common_chat_rag_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+    )
 
     return response
```
From openlit/instrumentation/anthropic/__init__.py:

```diff
@@ -10,6 +10,7 @@ from openlit.instrumentation.anthropic.async_anthropic import async_messages
 
 _instruments = ("anthropic >= 0.21.0",)
 
+
 class AnthropicInstrumentor(BaseInstrumentor):
     """
     An instrumentor for Anthropic's client library.
@@ -32,16 +33,32 @@ class AnthropicInstrumentor(BaseInstrumentor):
         wrap_function_wrapper(
             "anthropic.resources.messages",
             "Messages.create",
-            messages(version, environment, application_name, tracer,
-                pricing_info, capture_message_content, metrics, disable_metrics),
+            messages(
+                version,
+                environment,
+                application_name,
+                tracer,
+                pricing_info,
+                capture_message_content,
+                metrics,
+                disable_metrics,
+            ),
         )
 
         # async
         wrap_function_wrapper(
             "anthropic.resources.messages",
             "AsyncMessages.create",
-            async_messages(version, environment, application_name, tracer,
-                pricing_info, capture_message_content, metrics, disable_metrics),
+            async_messages(
+                version,
+                environment,
+                application_name,
+                tracer,
+                pricing_info,
+                capture_message_content,
+                metrics,
+                disable_metrics,
+            ),
        )
 
     def _uninstrument(self, **kwargs):
```
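The instrumentor patches by dotted path with wrapt's wrap_function_wrapper, so messages(...) above is a factory that returns the actual wrapper. A stripped-down sketch of that mechanism (the factory and wrapper bodies are illustrative, not openlit's):

```python
# Minimal wrapt-based monkey-patching sketch; the real openlit wrapper
# opens a span and routes the result through process_chat_response.
from wrapt import wrap_function_wrapper

def messages_factory(version):
    def wrapper(wrapped, instance, args, kwargs):
        # telemetry would be emitted around this call
        return wrapped(*args, **kwargs)
    return wrapper

wrap_function_wrapper(
    "anthropic.resources.messages",  # module path, resolved at patch time
    "Messages.create",               # attribute to replace
    messages_factory("1.34.31"),
)
```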
From openlit/instrumentation/anthropic/anthropic.py:

```diff
@@ -4,10 +4,7 @@ Module for monitoring Anthropic API calls.
 
 import time
 from opentelemetry.trace import SpanKind
-from openlit.__helpers import (
-    handle_exception,
-    set_server_address_and_port
-)
+from openlit.__helpers import handle_exception, set_server_address_and_port
 from openlit.instrumentation.anthropic.utils import (
     process_chunk,
     process_chat_response,
@@ -15,7 +12,17 @@ from openlit.instrumentation.anthropic.utils import (
 )
 from openlit.semcov import SemanticConvention
 
-def messages(version, environment, application_name, tracer, pricing_info, capture_message_content, metrics, disable_metrics):
+
+def messages(
+    version,
+    environment,
+    application_name,
+    tracer,
+    pricing_info,
+    capture_message_content,
+    metrics,
+    disable_metrics,
+):
     """
     Generates a telemetry wrapper for Anthropic Messages.create calls.
     """
@@ -26,14 +33,14 @@ def messages(version, environment, application_name, tracer, pricing_info, capture_message_content, metrics, disable_metrics):
         """
 
         def __init__(
-                self,
-                wrapped,
-                span,
-                span_name,
-                kwargs,
-                server_address,
-                server_port,
-        ):
+            self,
+            wrapped,
+            span,
+            span_name,
+            kwargs,
+            server_address,
+            server_port,
+        ):
             self.__wrapped__ = wrapped
             self._span = span
             self._span_name = span_name
```
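TracedSyncStream is a proxy that owns both the wrapped stream and the span state, so telemetry can be finalized once the stream is exhausted. A bare-bones sketch of the idea (the iteration hook is illustrative; the real class also handles context-manager and attribute passthrough):

```python
# Sketch of a traced stream proxy: forward chunks, accumulate state,
# finish the span when iteration ends. Simplified from the hunk above.
class TracedSyncStream:
    def __init__(self, wrapped, span, span_name, kwargs, server_address, server_port):
        self.__wrapped__ = wrapped
        self._span = span
        self._span_name = span_name
        self._kwargs = kwargs
        self._llmresponse = ""

    def __iter__(self):
        try:
            for chunk in self.__wrapped__:
                # process_chunk(self, chunk) would update aggregated fields here
                yield chunk
        finally:
            self._span.end()  # close the span once the stream is drained
```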
openlit/instrumentation/anthropic/anthropic.py (continued):

```diff
@@ -87,7 +94,7 @@ def messages(version, environment, application_name, tracer, pricing_info, capture_message_content, metrics, disable_metrics):
                     metrics=metrics,
                     capture_message_content=capture_message_content,
                     disable_metrics=disable_metrics,
-                    version=version
+                    version=version,
                 )
             except Exception as e:
                 handle_exception(self._span, e)
@@ -99,7 +106,9 @@ def messages(version, environment, application_name, tracer, pricing_info, capture_message_content, metrics, disable_metrics):
        """
 
        streaming = kwargs.get("stream", False)
-        server_address, server_port = set_server_address_and_port(instance, "api.anthropic.com", 443)
+        server_address, server_port = set_server_address_and_port(
+            instance, "api.anthropic.com", 443
+        )
        request_model = kwargs.get("model", "claude-3-5-sonnet-latest")
 
        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
@@ -109,7 +118,9 @@ def messages(version, environment, application_name, tracer, pricing_info, capture_message_content, metrics, disable_metrics):
            awaited_wrapped = wrapped(*args, **kwargs)
            span = tracer.start_span(span_name, kind=SpanKind.CLIENT)
 
-           return TracedSyncStream(awaited_wrapped, span, span_name, kwargs, server_address, server_port)
+           return TracedSyncStream(
+               awaited_wrapped, span, span_name, kwargs, server_address, server_port
+           )
 
        else:
            with tracer.start_as_current_span(span_name, kind=SpanKind.CLIENT) as span:
@@ -131,7 +142,7 @@ def messages(version, environment, application_name, tracer, pricing_info, capture_message_content, metrics, disable_metrics):
                 capture_message_content=capture_message_content,
                 disable_metrics=disable_metrics,
                 version=version,
-                **kwargs
+                **kwargs,
             )
 
             except Exception as e:
```