openlit 1.34.30__py3-none-any.whl → 1.34.31__py3-none-any.whl
This diff shows the changes between two publicly released versions of the package, as published to a supported public registry. It is provided for informational purposes only.
- openlit/__helpers.py +235 -86
- openlit/__init__.py +16 -13
- openlit/_instrumentors.py +2 -1
- openlit/evals/all.py +50 -21
- openlit/evals/bias_detection.py +47 -20
- openlit/evals/hallucination.py +53 -22
- openlit/evals/toxicity.py +50 -21
- openlit/evals/utils.py +54 -30
- openlit/guard/all.py +61 -19
- openlit/guard/prompt_injection.py +34 -14
- openlit/guard/restrict_topic.py +46 -15
- openlit/guard/sensitive_topic.py +34 -14
- openlit/guard/utils.py +58 -22
- openlit/instrumentation/ag2/__init__.py +24 -8
- openlit/instrumentation/ag2/ag2.py +34 -13
- openlit/instrumentation/ag2/async_ag2.py +34 -13
- openlit/instrumentation/ag2/utils.py +133 -30
- openlit/instrumentation/ai21/__init__.py +43 -14
- openlit/instrumentation/ai21/ai21.py +47 -21
- openlit/instrumentation/ai21/async_ai21.py +47 -21
- openlit/instrumentation/ai21/utils.py +299 -78
- openlit/instrumentation/anthropic/__init__.py +21 -4
- openlit/instrumentation/anthropic/anthropic.py +28 -17
- openlit/instrumentation/anthropic/async_anthropic.py +28 -17
- openlit/instrumentation/anthropic/utils.py +145 -35
- openlit/instrumentation/assemblyai/__init__.py +11 -2
- openlit/instrumentation/assemblyai/assemblyai.py +15 -4
- openlit/instrumentation/assemblyai/utils.py +120 -25
- openlit/instrumentation/astra/__init__.py +43 -10
- openlit/instrumentation/astra/astra.py +28 -5
- openlit/instrumentation/astra/async_astra.py +28 -5
- openlit/instrumentation/astra/utils.py +151 -55
- openlit/instrumentation/azure_ai_inference/__init__.py +43 -10
- openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +53 -21
- openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +53 -21
- openlit/instrumentation/azure_ai_inference/utils.py +307 -83
- openlit/instrumentation/bedrock/__init__.py +21 -4
- openlit/instrumentation/bedrock/bedrock.py +63 -25
- openlit/instrumentation/bedrock/utils.py +139 -30
- openlit/instrumentation/chroma/__init__.py +89 -16
- openlit/instrumentation/chroma/chroma.py +28 -6
- openlit/instrumentation/chroma/utils.py +167 -51
- openlit/instrumentation/cohere/__init__.py +63 -18
- openlit/instrumentation/cohere/async_cohere.py +63 -24
- openlit/instrumentation/cohere/cohere.py +63 -24
- openlit/instrumentation/cohere/utils.py +286 -73
- openlit/instrumentation/controlflow/__init__.py +35 -9
- openlit/instrumentation/controlflow/controlflow.py +66 -33
- openlit/instrumentation/crawl4ai/__init__.py +25 -10
- openlit/instrumentation/crawl4ai/async_crawl4ai.py +78 -31
- openlit/instrumentation/crawl4ai/crawl4ai.py +78 -31
- openlit/instrumentation/crewai/__init__.py +40 -15
- openlit/instrumentation/crewai/async_crewai.py +32 -7
- openlit/instrumentation/crewai/crewai.py +32 -7
- openlit/instrumentation/crewai/utils.py +159 -56
- openlit/instrumentation/dynamiq/__init__.py +46 -12
- openlit/instrumentation/dynamiq/dynamiq.py +74 -33
- openlit/instrumentation/elevenlabs/__init__.py +23 -4
- openlit/instrumentation/elevenlabs/async_elevenlabs.py +16 -4
- openlit/instrumentation/elevenlabs/elevenlabs.py +16 -4
- openlit/instrumentation/elevenlabs/utils.py +128 -25
- openlit/instrumentation/embedchain/__init__.py +11 -2
- openlit/instrumentation/embedchain/embedchain.py +68 -35
- openlit/instrumentation/firecrawl/__init__.py +24 -7
- openlit/instrumentation/firecrawl/firecrawl.py +46 -20
- openlit/instrumentation/google_ai_studio/__init__.py +45 -10
- openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +67 -44
- openlit/instrumentation/google_ai_studio/google_ai_studio.py +67 -44
- openlit/instrumentation/google_ai_studio/utils.py +180 -67
- openlit/instrumentation/gpt4all/__init__.py +22 -7
- openlit/instrumentation/gpt4all/gpt4all.py +67 -29
- openlit/instrumentation/gpt4all/utils.py +285 -61
- openlit/instrumentation/gpu/__init__.py +128 -47
- openlit/instrumentation/groq/__init__.py +21 -4
- openlit/instrumentation/groq/async_groq.py +33 -21
- openlit/instrumentation/groq/groq.py +33 -21
- openlit/instrumentation/groq/utils.py +192 -55
- openlit/instrumentation/haystack/__init__.py +70 -24
- openlit/instrumentation/haystack/async_haystack.py +28 -6
- openlit/instrumentation/haystack/haystack.py +28 -6
- openlit/instrumentation/haystack/utils.py +196 -74
- openlit/instrumentation/julep/__init__.py +69 -19
- openlit/instrumentation/julep/async_julep.py +53 -27
- openlit/instrumentation/julep/julep.py +53 -28
- openlit/instrumentation/langchain/__init__.py +74 -63
- openlit/instrumentation/langchain/callback_handler.py +1100 -0
- openlit/instrumentation/langchain_community/__init__.py +13 -2
- openlit/instrumentation/langchain_community/async_langchain_community.py +23 -5
- openlit/instrumentation/langchain_community/langchain_community.py +23 -5
- openlit/instrumentation/langchain_community/utils.py +35 -9
- openlit/instrumentation/letta/__init__.py +68 -15
- openlit/instrumentation/letta/letta.py +99 -54
- openlit/instrumentation/litellm/__init__.py +43 -14
- openlit/instrumentation/litellm/async_litellm.py +51 -26
- openlit/instrumentation/litellm/litellm.py +51 -26
- openlit/instrumentation/litellm/utils.py +304 -102
- openlit/instrumentation/llamaindex/__init__.py +267 -90
- openlit/instrumentation/llamaindex/async_llamaindex.py +28 -6
- openlit/instrumentation/llamaindex/llamaindex.py +28 -6
- openlit/instrumentation/llamaindex/utils.py +204 -91
- openlit/instrumentation/mem0/__init__.py +11 -2
- openlit/instrumentation/mem0/mem0.py +50 -29
- openlit/instrumentation/milvus/__init__.py +10 -2
- openlit/instrumentation/milvus/milvus.py +31 -6
- openlit/instrumentation/milvus/utils.py +166 -67
- openlit/instrumentation/mistral/__init__.py +63 -18
- openlit/instrumentation/mistral/async_mistral.py +63 -24
- openlit/instrumentation/mistral/mistral.py +63 -24
- openlit/instrumentation/mistral/utils.py +277 -69
- openlit/instrumentation/multion/__init__.py +69 -19
- openlit/instrumentation/multion/async_multion.py +57 -26
- openlit/instrumentation/multion/multion.py +57 -26
- openlit/instrumentation/ollama/__init__.py +39 -18
- openlit/instrumentation/ollama/async_ollama.py +57 -26
- openlit/instrumentation/ollama/ollama.py +57 -26
- openlit/instrumentation/ollama/utils.py +226 -50
- openlit/instrumentation/openai/__init__.py +156 -32
- openlit/instrumentation/openai/async_openai.py +147 -67
- openlit/instrumentation/openai/openai.py +150 -67
- openlit/instrumentation/openai/utils.py +657 -185
- openlit/instrumentation/openai_agents/__init__.py +5 -1
- openlit/instrumentation/openai_agents/processor.py +110 -90
- openlit/instrumentation/phidata/__init__.py +13 -5
- openlit/instrumentation/phidata/phidata.py +67 -32
- openlit/instrumentation/pinecone/__init__.py +48 -9
- openlit/instrumentation/pinecone/async_pinecone.py +27 -5
- openlit/instrumentation/pinecone/pinecone.py +27 -5
- openlit/instrumentation/pinecone/utils.py +153 -47
- openlit/instrumentation/premai/__init__.py +22 -7
- openlit/instrumentation/premai/premai.py +51 -26
- openlit/instrumentation/premai/utils.py +246 -59
- openlit/instrumentation/pydantic_ai/__init__.py +49 -22
- openlit/instrumentation/pydantic_ai/pydantic_ai.py +69 -16
- openlit/instrumentation/pydantic_ai/utils.py +89 -24
- openlit/instrumentation/qdrant/__init__.py +19 -4
- openlit/instrumentation/qdrant/async_qdrant.py +33 -7
- openlit/instrumentation/qdrant/qdrant.py +33 -7
- openlit/instrumentation/qdrant/utils.py +228 -93
- openlit/instrumentation/reka/__init__.py +23 -10
- openlit/instrumentation/reka/async_reka.py +17 -11
- openlit/instrumentation/reka/reka.py +17 -11
- openlit/instrumentation/reka/utils.py +138 -36
- openlit/instrumentation/together/__init__.py +44 -12
- openlit/instrumentation/together/async_together.py +50 -27
- openlit/instrumentation/together/together.py +50 -27
- openlit/instrumentation/together/utils.py +301 -71
- openlit/instrumentation/transformers/__init__.py +2 -1
- openlit/instrumentation/transformers/transformers.py +13 -3
- openlit/instrumentation/transformers/utils.py +139 -36
- openlit/instrumentation/vertexai/__init__.py +81 -16
- openlit/instrumentation/vertexai/async_vertexai.py +33 -15
- openlit/instrumentation/vertexai/utils.py +123 -27
- openlit/instrumentation/vertexai/vertexai.py +33 -15
- openlit/instrumentation/vllm/__init__.py +12 -5
- openlit/instrumentation/vllm/utils.py +121 -31
- openlit/instrumentation/vllm/vllm.py +16 -10
- openlit/otel/events.py +35 -10
- openlit/otel/metrics.py +32 -24
- openlit/otel/tracing.py +24 -9
- openlit/semcov/__init__.py +72 -6
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/METADATA +2 -1
- openlit-1.34.31.dist-info/RECORD +166 -0
- openlit/instrumentation/langchain/async_langchain.py +0 -102
- openlit/instrumentation/langchain/langchain.py +0 -102
- openlit/instrumentation/langchain/utils.py +0 -252
- openlit-1.34.30.dist-info/RECORD +0 -168
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/LICENSE +0 -0
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/WHEEL +0 -0
openlit/instrumentation/litellm/utils.py

```diff
@@ -1,6 +1,7 @@
 """
 LiteLLM OpenTelemetry instrumentation utility functions
 """
+
 import time
 
 from opentelemetry.trace import Status, StatusCode
@@ -17,6 +18,7 @@ from openlit.__helpers import (
 )
 from openlit.semcov import SemanticConvention
 
+
 def format_content(messages):
     """
     Process a list of messages to extract content.
@@ -24,20 +26,22 @@ def format_content(messages):
 
     formatted_messages = []
     for message in messages:
-        role = message[
-        content = message[
+        role = message["role"]
+        content = message["content"]
 
         if isinstance(content, list):
             content_str = ", ".join(
-                f
-                if "type" in item
+                f"{item['type']}: {item['text'] if 'text' in item else item['image_url']}"
+                if "type" in item
+                else f"text: {item['text']}"
                 for item in content
             )
-            formatted_messages.append(f
+            formatted_messages.append(f"{role}: {content_str}")
         else:
-            formatted_messages.append(f
+            formatted_messages.append(f"{role}: {content}")
+
+    return "\n".join(formatted_messages)
 
-    return '\n'.join(formatted_messages)
 
 def process_chunk(scope, chunk):
     """
```
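For reference, the reformatted `format_content` flattens an OpenAI-style `messages` list into one newline-joined string. A minimal sketch of the expected behavior (the sample messages are hypothetical):

```python
# Hypothetical sample input; format_content is the helper shown in the hunk above.
from openlit.instrumentation.litellm.utils import format_content

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {
        "role": "user",
        "content": [
            {"type": "text", "text": "Describe this image"},
            {"type": "image_url", "image_url": "https://example.com/cat.png"},
        ],
    },
]

print(format_content(messages))
# system: You are a helpful assistant.
# user: text: Describe this image, image_url: https://example.com/cat.png
```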
```diff
@@ -55,45 +59,63 @@ def process_chunk(scope, chunk):
     chunked = response_as_dict(chunk)
 
     # Collect message IDs and aggregated response from events
-    if
-
-
-
+    if len(chunked.get("choices", [])) > 0 and (
+        "delta" in chunked.get("choices")[0]
+        and "content" in chunked.get("choices")[0].get("delta", {})
+    ):
+        content = chunked.get("choices")[0].get("delta").get("content")
         if content:
             scope._llmresponse += content
 
     # Handle tool calls in streaming - optimized
-    delta_tools = chunked.get(
+    delta_tools = chunked.get("choices", [{}])[0].get("delta", {}).get("tool_calls")
     if delta_tools:
         scope._tools = scope._tools or []
 
         for tool in delta_tools:
-            idx = tool.get(
+            idx = tool.get("index", 0)
 
             # Extend list if needed
             scope._tools.extend([{}] * (idx + 1 - len(scope._tools)))
 
-            if tool.get(
-                func = tool.get(
+            if tool.get("id"):  # New tool (id exists)
+                func = tool.get("function", {})
                 scope._tools[idx] = {
-
-
-
+                    "id": tool["id"],
+                    "function": {
+                        "name": func.get("name", ""),
+                        "arguments": func.get("arguments", ""),
+                    },
+                    "type": tool.get("type", "function"),
                 }
-            elif
-                scope._tools[idx]
-
-
-
-
-
-
-                scope.
-                scope.
+            elif (
+                scope._tools[idx] and "function" in tool
+            ):  # Append args (id is None)
+                scope._tools[idx]["function"]["arguments"] += tool["function"].get(
+                    "arguments", ""
+                )
+
+    if chunked.get("usage"):
+        scope._input_tokens = chunked.get("usage").get("prompt_tokens", 0)
+        scope._output_tokens = chunked.get("usage").get("completion_tokens", 0)
+        scope._response_id = chunked.get("id")
+        scope._response_model = chunked.get("model")
+        scope._finish_reason = chunked.get("choices", [{}])[0].get("finish_reason")
+        scope._response_service_tier = str(chunked.get("system_fingerprint", ""))
         scope._end_time = time.time()
 
-
-
+
+def common_chat_logic(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content,
+    disable_metrics,
+    version,
+    is_stream,
+):
     """
     Process chat request and generate Telemetry
     """
```
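The reworked streaming path merges tool-call deltas by `index`: a delta carrying an `id` starts a new tool entry, while id-less deltas append to that entry's `arguments`. A standalone sketch of the merge rule (the streamed delta payloads are hypothetical):

```python
# Standalone sketch of the delta-merge rule from process_chunk above;
# the streamed deltas below are hypothetical.
tools = []
deltas = [
    {"index": 0, "id": "call_1", "type": "function",
     "function": {"name": "get_weather", "arguments": ""}},
    {"index": 0, "function": {"arguments": '{"city": '}},
    {"index": 0, "function": {"arguments": '"Paris"}'}},
]

for tool in deltas:
    idx = tool.get("index", 0)
    tools.extend([{}] * (idx + 1 - len(tools)))  # grow the list to fit the index
    if tool.get("id"):  # an id marks the start of a new tool call
        func = tool.get("function", {})
        tools[idx] = {
            "id": tool["id"],
            "function": {"name": func.get("name", ""),
                         "arguments": func.get("arguments", "")},
            "type": tool.get("type", "function"),
        }
    elif tools[idx] and "function" in tool:  # id-less delta: append arguments
        tools[idx]["function"]["arguments"] += tool["function"].get("arguments", "")

print(tools[0]["function"]["arguments"])  # {"city": "Paris"}
```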
```diff
@@ -101,65 +123,135 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
     if len(scope._timestamps) > 1:
         scope._tbt = calculate_tbt(scope._timestamps)
 
-    prompt = format_content(scope._kwargs.get(
-    request_model = scope._kwargs.get(
+    prompt = format_content(scope._kwargs.get("messages", []))
+    request_model = scope._kwargs.get("model", "openai/gpt-4o")
 
-    cost = get_chat_model_cost(
+    cost = get_chat_model_cost(
+        request_model, pricing_info, scope._input_tokens, scope._output_tokens
+    )
 
     # Common Span Attributes
-    common_span_attributes(
-
-
-
+    common_span_attributes(
+        scope,
+        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+        SemanticConvention.GEN_AI_SYSTEM_LITELLM,
+        scope._server_address,
+        scope._server_port,
+        request_model,
+        scope._response_model,
+        environment,
+        application_name,
+        is_stream,
+        scope._tbt,
+        scope._ttft,
+        version,
+    )
 
     # Helper function to handle None values with proper defaults
     def safe_get(value, default):
         return default if value is None else value
 
     # Span Attributes for Request parameters
-    scope._span.set_attribute(
-
-
-    scope._span.set_attribute(
-
-
-
-    scope._span.set_attribute(
-
-
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_SEED, safe_get(scope._kwargs.get("seed"), "")
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY,
+        safe_get(scope._kwargs.get("frequency_penalty"), 0.0),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS,
+        safe_get(scope._kwargs.get("max_tokens"), -1),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY,
+        safe_get(scope._kwargs.get("presence_penalty"), 0.0),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, scope._kwargs.get("stop", [])
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_TEMPERATURE,
+        safe_get(scope._kwargs.get("temperature"), 1.0),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_TOP_P,
+        safe_get(scope._kwargs.get("top_p"), 1.0),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_USER, safe_get(scope._kwargs.get("user"), "")
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_SERVICE_TIER,
+        safe_get(scope._kwargs.get("service_tier"), "auto"),
+    )
 
     # Span Attributes for Response parameters
     scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_ID, scope._response_id)
-    scope._span.set_attribute(
-
-
-    scope._span.set_attribute(
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON, [scope._finish_reason]
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RESPONSE_SERVICE_TIER, scope._response_service_tier
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_RESPONSE_SYSTEM_FINGERPRINT,
+        scope._response_service_tier,
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_OUTPUT_TYPE,
+        "text" if isinstance(scope._llmresponse, str) else "json",
+    )
 
     # Span Attributes for Cost and Tokens
-    scope._span.set_attribute(
-
-
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE,
+        scope._input_tokens + scope._output_tokens,
+    )
     scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
 
     # Span Attributes for Tools - optimized
     if scope._tools:
         tools = scope._tools if isinstance(scope._tools, list) else [scope._tools]
 
-        names, ids, args =
-        (
-
-
-
-
+        names, ids, args = (
+            zip(
+                *[
+                    (
+                        t.get("function", {}).get("name", ""),
+                        str(t.get("id", "")),
+                        str(t.get("function", {}).get("arguments", "")),
+                    )
+                    for t in tools
+                    if isinstance(t, dict) and t
+                ]
+            )
+            if tools
+            else ([], [], [])
+        )
 
-        scope._span.set_attribute(
-
-
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_NAME, ", ".join(filter(None, names))
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_CALL_ID, ", ".join(filter(None, ids))
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_ARGS, ", ".join(filter(None, args))
+        )
 
     # Span Attributes for Content
     if capture_message_content:
         scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_PROMPT, prompt)
-        scope._span.set_attribute(
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse
+        )
 
     # To be removed once the change to span_attributes (from span events) is complete
     scope._span.add_event(
@@ -179,23 +271,69 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
 
     # Metrics
     if not disable_metrics:
-        record_completion_metrics(
-
-
-
+        record_completion_metrics(
+            metrics,
+            SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+            SemanticConvention.GEN_AI_SYSTEM_LITELLM,
+            scope._server_address,
+            scope._server_port,
+            request_model,
+            scope._response_model,
+            environment,
+            application_name,
+            scope._start_time,
+            scope._end_time,
+            scope._input_tokens,
+            scope._output_tokens,
+            cost,
+            scope._tbt,
+            scope._ttft,
+        )
+
 
-def process_streaming_chat_response(
-
+def process_streaming_chat_response(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="",
+):
     """
     Process streaming chat request and generate Telemetry
     """
 
-    common_chat_logic(
-
+    common_chat_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+        is_stream=True,
+    )
+
 
-def process_chat_response(
-
-
+def process_chat_response(
+    response,
+    request_model,
+    pricing_info,
+    server_port,
+    server_address,
+    environment,
+    application_name,
+    metrics,
+    start_time,
+    span,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="1.0.0",
+    **kwargs,
+):
     """
     Process chat request and generate Telemetry
     """
```
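The tools block in `common_chat_logic` unzips `(name, id, arguments)` triples in a single pass via `zip(*...)`. A small illustration of that idiom (both tool dicts are hypothetical):

```python
# Illustration of the zip(*) unzip idiom used for the tool span attributes;
# both tool dicts below are hypothetical.
tools = [
    {"id": "call_1", "type": "function",
     "function": {"name": "get_weather", "arguments": '{"city": "Paris"}'}},
    {"id": "call_2", "type": "function",
     "function": {"name": "get_time", "arguments": '{"tz": "CET"}'}},
]

names, ids, args = (
    zip(*[
        (t.get("function", {}).get("name", ""),
         str(t.get("id", "")),
         str(t.get("function", {}).get("arguments", "")))
        for t in tools
        if isinstance(t, dict) and t
    ])
    if tools
    else ([], [], [])
)

print(", ".join(filter(None, names)))  # get_weather, get_time
print(", ".join(filter(None, ids)))    # call_1, call_2
```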
```diff
@@ -211,12 +349,14 @@ def process_chat_response(response, request_model, pricing_info, server_port, se
         (choice.get("message", {}).get("content") or "")
         for choice in response_dict.get("choices", [])
     )
-    scope._input_tokens = response_dict.get(
-    scope._output_tokens = response_dict.get(
-    scope._response_id = response_dict.get(
-    scope._response_model = response_dict.get(
-    scope._finish_reason = str(
-
+    scope._input_tokens = response_dict.get("usage", {}).get("prompt_tokens", 0)
+    scope._output_tokens = response_dict.get("usage", {}).get("completion_tokens", 0)
+    scope._response_id = response_dict.get("id")
+    scope._response_model = response_dict.get("model")
+    scope._finish_reason = str(
+        response_dict.get("choices", [])[0].get("finish_reason", "")
+    )
+    scope._response_service_tier = str(response_dict.get("system_fingerprint", ""))
     scope._timestamps = []
     scope._ttft, scope._tbt = scope._end_time - scope._start_time, 0
     scope._server_address, scope._server_port = server_address, server_port
@@ -224,18 +364,43 @@ def process_chat_response(response, request_model, pricing_info, server_port, se
 
     # Handle tool calls
     if scope._kwargs.get("tools"):
-        scope._tools =
+        scope._tools = (
+            response_dict.get("choices", [{}])[0].get("message", {}).get("tool_calls")
+        )
     else:
         scope._tools = None
 
-    common_chat_logic(
-
+    common_chat_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+        is_stream=False,
+    )
 
     return response
 
-
-
-
+
+def process_embedding_response(
+    response,
+    request_model,
+    pricing_info,
+    server_port,
+    server_address,
+    environment,
+    application_name,
+    metrics,
+    start_time,
+    span,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="1.0.0",
+    **kwargs,
+):
     """
     Process embedding request and generate Telemetry
     """
```
```diff
@@ -247,8 +412,8 @@ def process_embedding_response(response, request_model, pricing_info, server_por
     scope._start_time = start_time
     scope._end_time = time.time()
     scope._span = span
-    scope._input_tokens = response_dict.get(
-    scope._response_model = response_dict.get(
+    scope._input_tokens = response_dict.get("usage", {}).get("prompt_tokens", 0)
+    scope._response_model = response_dict.get("model")
     scope._server_address, scope._server_port = server_address, server_port
     scope._kwargs = kwargs
 
@@ -256,33 +421,58 @@ def process_embedding_response(response, request_model, pricing_info, server_por
     cost = get_embed_model_cost(request_model, pricing_info, scope._input_tokens)
 
     # Common Span Attributes
-    common_span_attributes(
-
-
-
+    common_span_attributes(
+        scope,
+        SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING,
+        SemanticConvention.GEN_AI_SYSTEM_LITELLM,
+        scope._server_address,
+        scope._server_port,
+        request_model,
+        scope._response_model,
+        environment,
+        application_name,
+        False,
+        0,
+        scope._end_time - scope._start_time,
+        version,
+    )
 
     # Helper function to handle None values with proper defaults
     def safe_get(value, default):
         return default if value is None else value
 
     # Span Attributes for Request parameters
-    scope._span.set_attribute(
-
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_ENCODING_FORMATS,
+        [scope._kwargs.get("encoding_format", "float")],
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_USER, safe_get(scope._kwargs.get("user"), "")
+    )
 
     # Span Attributes for Cost and Tokens
-    scope._span.set_attribute(
-
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, scope._input_tokens
+    )
     scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
 
     # Span Attributes for Content
     if capture_message_content:
-        scope._span.set_attribute(
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_CONTENT_PROMPT,
+            str(scope._kwargs.get("input", "")),
+        )
 
     # To be removed once the change to span_attributes (from span events) is complete
     scope._span.add_event(
         name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
         attributes={
-            SemanticConvention.GEN_AI_CONTENT_PROMPT: str(
+            SemanticConvention.GEN_AI_CONTENT_PROMPT: str(
+                scope._kwargs.get("input", "")
+            ),
         },
     )
 
@@ -290,8 +480,20 @@ def process_embedding_response(response, request_model, pricing_info, server_por
 
     # Metrics
     if not disable_metrics:
-        record_embedding_metrics(
-
-
+        record_embedding_metrics(
+            metrics,
+            SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING,
+            SemanticConvention.GEN_AI_SYSTEM_LITELLM,
+            scope._server_address,
+            scope._server_port,
+            request_model,
+            scope._response_model,
+            environment,
+            application_name,
+            scope._start_time,
+            scope._end_time,
+            scope._input_tokens,
+            cost,
+        )
 
     return response
```
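These utilities run inside the LiteLLM instrumentor that `openlit.init()` installs. A minimal usage sketch (the OTLP endpoint and model name are placeholder values):

```python
# Minimal sketch: once openlit.init() runs, litellm.completion() calls are
# traced through the utilities shown in the diff above.
# The endpoint and model below are placeholders.
import openlit
import litellm

openlit.init(otlp_endpoint="http://127.0.0.1:4318")

response = litellm.completion(
    model="gpt-4o-mini",
    messages=[{"role": "user", "content": "Hello!"}],
)
print(response.choices[0].message.content)
```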