openlit 1.34.30__py3-none-any.whl → 1.34.31__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- openlit/__helpers.py +235 -86
- openlit/__init__.py +16 -13
- openlit/_instrumentors.py +2 -1
- openlit/evals/all.py +50 -21
- openlit/evals/bias_detection.py +47 -20
- openlit/evals/hallucination.py +53 -22
- openlit/evals/toxicity.py +50 -21
- openlit/evals/utils.py +54 -30
- openlit/guard/all.py +61 -19
- openlit/guard/prompt_injection.py +34 -14
- openlit/guard/restrict_topic.py +46 -15
- openlit/guard/sensitive_topic.py +34 -14
- openlit/guard/utils.py +58 -22
- openlit/instrumentation/ag2/__init__.py +24 -8
- openlit/instrumentation/ag2/ag2.py +34 -13
- openlit/instrumentation/ag2/async_ag2.py +34 -13
- openlit/instrumentation/ag2/utils.py +133 -30
- openlit/instrumentation/ai21/__init__.py +43 -14
- openlit/instrumentation/ai21/ai21.py +47 -21
- openlit/instrumentation/ai21/async_ai21.py +47 -21
- openlit/instrumentation/ai21/utils.py +299 -78
- openlit/instrumentation/anthropic/__init__.py +21 -4
- openlit/instrumentation/anthropic/anthropic.py +28 -17
- openlit/instrumentation/anthropic/async_anthropic.py +28 -17
- openlit/instrumentation/anthropic/utils.py +145 -35
- openlit/instrumentation/assemblyai/__init__.py +11 -2
- openlit/instrumentation/assemblyai/assemblyai.py +15 -4
- openlit/instrumentation/assemblyai/utils.py +120 -25
- openlit/instrumentation/astra/__init__.py +43 -10
- openlit/instrumentation/astra/astra.py +28 -5
- openlit/instrumentation/astra/async_astra.py +28 -5
- openlit/instrumentation/astra/utils.py +151 -55
- openlit/instrumentation/azure_ai_inference/__init__.py +43 -10
- openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +53 -21
- openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +53 -21
- openlit/instrumentation/azure_ai_inference/utils.py +307 -83
- openlit/instrumentation/bedrock/__init__.py +21 -4
- openlit/instrumentation/bedrock/bedrock.py +63 -25
- openlit/instrumentation/bedrock/utils.py +139 -30
- openlit/instrumentation/chroma/__init__.py +89 -16
- openlit/instrumentation/chroma/chroma.py +28 -6
- openlit/instrumentation/chroma/utils.py +167 -51
- openlit/instrumentation/cohere/__init__.py +63 -18
- openlit/instrumentation/cohere/async_cohere.py +63 -24
- openlit/instrumentation/cohere/cohere.py +63 -24
- openlit/instrumentation/cohere/utils.py +286 -73
- openlit/instrumentation/controlflow/__init__.py +35 -9
- openlit/instrumentation/controlflow/controlflow.py +66 -33
- openlit/instrumentation/crawl4ai/__init__.py +25 -10
- openlit/instrumentation/crawl4ai/async_crawl4ai.py +78 -31
- openlit/instrumentation/crawl4ai/crawl4ai.py +78 -31
- openlit/instrumentation/crewai/__init__.py +40 -15
- openlit/instrumentation/crewai/async_crewai.py +32 -7
- openlit/instrumentation/crewai/crewai.py +32 -7
- openlit/instrumentation/crewai/utils.py +159 -56
- openlit/instrumentation/dynamiq/__init__.py +46 -12
- openlit/instrumentation/dynamiq/dynamiq.py +74 -33
- openlit/instrumentation/elevenlabs/__init__.py +23 -4
- openlit/instrumentation/elevenlabs/async_elevenlabs.py +16 -4
- openlit/instrumentation/elevenlabs/elevenlabs.py +16 -4
- openlit/instrumentation/elevenlabs/utils.py +128 -25
- openlit/instrumentation/embedchain/__init__.py +11 -2
- openlit/instrumentation/embedchain/embedchain.py +68 -35
- openlit/instrumentation/firecrawl/__init__.py +24 -7
- openlit/instrumentation/firecrawl/firecrawl.py +46 -20
- openlit/instrumentation/google_ai_studio/__init__.py +45 -10
- openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +67 -44
- openlit/instrumentation/google_ai_studio/google_ai_studio.py +67 -44
- openlit/instrumentation/google_ai_studio/utils.py +180 -67
- openlit/instrumentation/gpt4all/__init__.py +22 -7
- openlit/instrumentation/gpt4all/gpt4all.py +67 -29
- openlit/instrumentation/gpt4all/utils.py +285 -61
- openlit/instrumentation/gpu/__init__.py +128 -47
- openlit/instrumentation/groq/__init__.py +21 -4
- openlit/instrumentation/groq/async_groq.py +33 -21
- openlit/instrumentation/groq/groq.py +33 -21
- openlit/instrumentation/groq/utils.py +192 -55
- openlit/instrumentation/haystack/__init__.py +70 -24
- openlit/instrumentation/haystack/async_haystack.py +28 -6
- openlit/instrumentation/haystack/haystack.py +28 -6
- openlit/instrumentation/haystack/utils.py +196 -74
- openlit/instrumentation/julep/__init__.py +69 -19
- openlit/instrumentation/julep/async_julep.py +53 -27
- openlit/instrumentation/julep/julep.py +53 -28
- openlit/instrumentation/langchain/__init__.py +74 -63
- openlit/instrumentation/langchain/callback_handler.py +1100 -0
- openlit/instrumentation/langchain_community/__init__.py +13 -2
- openlit/instrumentation/langchain_community/async_langchain_community.py +23 -5
- openlit/instrumentation/langchain_community/langchain_community.py +23 -5
- openlit/instrumentation/langchain_community/utils.py +35 -9
- openlit/instrumentation/letta/__init__.py +68 -15
- openlit/instrumentation/letta/letta.py +99 -54
- openlit/instrumentation/litellm/__init__.py +43 -14
- openlit/instrumentation/litellm/async_litellm.py +51 -26
- openlit/instrumentation/litellm/litellm.py +51 -26
- openlit/instrumentation/litellm/utils.py +304 -102
- openlit/instrumentation/llamaindex/__init__.py +267 -90
- openlit/instrumentation/llamaindex/async_llamaindex.py +28 -6
- openlit/instrumentation/llamaindex/llamaindex.py +28 -6
- openlit/instrumentation/llamaindex/utils.py +204 -91
- openlit/instrumentation/mem0/__init__.py +11 -2
- openlit/instrumentation/mem0/mem0.py +50 -29
- openlit/instrumentation/milvus/__init__.py +10 -2
- openlit/instrumentation/milvus/milvus.py +31 -6
- openlit/instrumentation/milvus/utils.py +166 -67
- openlit/instrumentation/mistral/__init__.py +63 -18
- openlit/instrumentation/mistral/async_mistral.py +63 -24
- openlit/instrumentation/mistral/mistral.py +63 -24
- openlit/instrumentation/mistral/utils.py +277 -69
- openlit/instrumentation/multion/__init__.py +69 -19
- openlit/instrumentation/multion/async_multion.py +57 -26
- openlit/instrumentation/multion/multion.py +57 -26
- openlit/instrumentation/ollama/__init__.py +39 -18
- openlit/instrumentation/ollama/async_ollama.py +57 -26
- openlit/instrumentation/ollama/ollama.py +57 -26
- openlit/instrumentation/ollama/utils.py +226 -50
- openlit/instrumentation/openai/__init__.py +156 -32
- openlit/instrumentation/openai/async_openai.py +147 -67
- openlit/instrumentation/openai/openai.py +150 -67
- openlit/instrumentation/openai/utils.py +657 -185
- openlit/instrumentation/openai_agents/__init__.py +5 -1
- openlit/instrumentation/openai_agents/processor.py +110 -90
- openlit/instrumentation/phidata/__init__.py +13 -5
- openlit/instrumentation/phidata/phidata.py +67 -32
- openlit/instrumentation/pinecone/__init__.py +48 -9
- openlit/instrumentation/pinecone/async_pinecone.py +27 -5
- openlit/instrumentation/pinecone/pinecone.py +27 -5
- openlit/instrumentation/pinecone/utils.py +153 -47
- openlit/instrumentation/premai/__init__.py +22 -7
- openlit/instrumentation/premai/premai.py +51 -26
- openlit/instrumentation/premai/utils.py +246 -59
- openlit/instrumentation/pydantic_ai/__init__.py +49 -22
- openlit/instrumentation/pydantic_ai/pydantic_ai.py +69 -16
- openlit/instrumentation/pydantic_ai/utils.py +89 -24
- openlit/instrumentation/qdrant/__init__.py +19 -4
- openlit/instrumentation/qdrant/async_qdrant.py +33 -7
- openlit/instrumentation/qdrant/qdrant.py +33 -7
- openlit/instrumentation/qdrant/utils.py +228 -93
- openlit/instrumentation/reka/__init__.py +23 -10
- openlit/instrumentation/reka/async_reka.py +17 -11
- openlit/instrumentation/reka/reka.py +17 -11
- openlit/instrumentation/reka/utils.py +138 -36
- openlit/instrumentation/together/__init__.py +44 -12
- openlit/instrumentation/together/async_together.py +50 -27
- openlit/instrumentation/together/together.py +50 -27
- openlit/instrumentation/together/utils.py +301 -71
- openlit/instrumentation/transformers/__init__.py +2 -1
- openlit/instrumentation/transformers/transformers.py +13 -3
- openlit/instrumentation/transformers/utils.py +139 -36
- openlit/instrumentation/vertexai/__init__.py +81 -16
- openlit/instrumentation/vertexai/async_vertexai.py +33 -15
- openlit/instrumentation/vertexai/utils.py +123 -27
- openlit/instrumentation/vertexai/vertexai.py +33 -15
- openlit/instrumentation/vllm/__init__.py +12 -5
- openlit/instrumentation/vllm/utils.py +121 -31
- openlit/instrumentation/vllm/vllm.py +16 -10
- openlit/otel/events.py +35 -10
- openlit/otel/metrics.py +32 -24
- openlit/otel/tracing.py +24 -9
- openlit/semcov/__init__.py +72 -6
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/METADATA +2 -1
- openlit-1.34.31.dist-info/RECORD +166 -0
- openlit/instrumentation/langchain/async_langchain.py +0 -102
- openlit/instrumentation/langchain/langchain.py +0 -102
- openlit/instrumentation/langchain/utils.py +0 -252
- openlit-1.34.30.dist-info/RECORD +0 -168
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/LICENSE +0 -0
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/WHEEL +0 -0
openlit/instrumentation/vertexai/utils.py CHANGED

@@ -1,6 +1,7 @@
 """
 VertexAI OpenTelemetry instrumentation utility functions
 """
+
 import time
 
 from opentelemetry.trace import Status, StatusCode
@@ -14,6 +15,7 @@ from openlit.__helpers import (
 )
 from openlit.semcov import SemanticConvention
 
+
 def format_content(contents):
     """
     Format the VertexAI contents into a string for span events.
@@ -37,7 +39,9 @@ def format_content(contents):
             if part.thought:
                 content_str.append(f"thought: {part.thought}")
             if part.code_execution_result:
-                content_str.append(f"code_execution_result: {part.code_execution_result}")
+                content_str.append(
+                    f"code_execution_result: {part.code_execution_result}"
+                )
             if part.executable_code:
                 content_str.append(f"executable_code: {part.executable_code}")
             if part.file_data:
@@ -53,6 +57,7 @@ def format_content(contents):
 
     return "\n".join(formatted_messages)
 
+
 def process_chunk(scope, chunk):
     """
     Process a chunk of response data and update state.
@@ -71,8 +76,18 @@ def process_chunk(scope, chunk):
         scope._input_tokens = chunk.usage_metadata.prompt_token_count
         scope._output_tokens = chunk.usage_metadata.candidates_token_count
 
-def common_chat_logic(scope, pricing_info, environment, application_name, metrics,
-    capture_message_content, disable_metrics, version, is_stream):
+
+def common_chat_logic(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content,
+    disable_metrics,
+    version,
+    is_stream,
+):
     """
     Process chat request and generate Telemetry
     """
@@ -86,13 +101,26 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
     formatted_messages = format_content(contents)
     prompt = formatted_messages or str(scope._args[0][0])
 
-    cost = get_chat_model_cost(scope._request_model, pricing_info, scope._input_tokens, scope._output_tokens)
+    cost = get_chat_model_cost(
+        scope._request_model, pricing_info, scope._input_tokens, scope._output_tokens
+    )
 
     # Common Span Attributes
-    common_span_attributes(scope,
-        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_VERTEXAI,
-        scope._server_address, scope._server_port, scope._request_model, scope._request_model,
-        environment, application_name, is_stream, scope._tbt, scope._ttft, version)
+    common_span_attributes(
+        scope,
+        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+        SemanticConvention.GEN_AI_SYSTEM_VERTEXAI,
+        scope._server_address,
+        scope._server_port,
+        scope._request_model,
+        scope._request_model,
+        environment,
+        application_name,
+        is_stream,
+        scope._tbt,
+        scope._ttft,
+        version,
+    )
 
     # Span Attributes for Request parameters (VertexAI-specific)
     inference_config = scope._kwargs.get("generation_config", {})
@@ -115,18 +143,30 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
             scope._span.set_attribute(attribute, value)
 
     # Span Attributes for Response parameters
-    scope._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE, "text" if isinstance(scope._llmresponse, str) else "json")
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_OUTPUT_TYPE,
+        "text" if isinstance(scope._llmresponse, str) else "json",
+    )
 
     # Span Attributes for Cost and Tokens
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, scope._input_tokens + scope._output_tokens)
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE,
+        scope._input_tokens + scope._output_tokens,
+    )
     scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
 
     # Span Attributes for Content
     if capture_message_content:
         scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_PROMPT, prompt)
-        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse)
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse
+        )
 
     # To be removed once the change to span_attributes (from span events) is complete
     scope._span.add_event(
@@ -146,23 +186,69 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
 
     # Record metrics
     if not disable_metrics:
-        record_completion_metrics(metrics, SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_VERTEXAI,
-            scope._server_address, scope._server_port, scope._request_model, scope._request_model, environment,
-            application_name, scope._start_time, scope._end_time, scope._input_tokens, scope._output_tokens,
-            cost, scope._tbt, scope._ttft)
+        record_completion_metrics(
+            metrics,
+            SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+            SemanticConvention.GEN_AI_SYSTEM_VERTEXAI,
+            scope._server_address,
+            scope._server_port,
+            scope._request_model,
+            scope._request_model,
+            environment,
+            application_name,
+            scope._start_time,
+            scope._end_time,
+            scope._input_tokens,
+            scope._output_tokens,
+            cost,
+            scope._tbt,
+            scope._ttft,
+        )
+
 
-def process_streaming_chat_response(scope, pricing_info, environment, application_name, metrics,
-    capture_message_content=False, disable_metrics=False, version=""):
+def process_streaming_chat_response(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="",
+):
     """
     Process streaming chat response and generate telemetry.
     """
 
-    common_chat_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version, is_stream=True)
-
-def process_chat_response(response, request_model, pricing_info, server_port, server_address,
-    environment, application_name, metrics, start_time, span, capture_message_content=False,
-    disable_metrics=False, version="1.0.0", **kwargs):
+    common_chat_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+        is_stream=True,
+    )
+
+
+def process_chat_response(
+    response,
+    request_model,
+    pricing_info,
+    server_port,
+    server_address,
+    environment,
+    application_name,
+    metrics,
+    start_time,
+    span,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="1.0.0",
+    **kwargs,
+):
     """
     Process non-streaming chat response and generate telemetry.
     """
@@ -182,11 +268,21 @@ def process_chat_response(response, request_model, pricing_info, server_port, se
     scope._kwargs = kwargs
     scope._args = [kwargs.get("contents", [])]
 
-    common_chat_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version, is_stream=False)
+    common_chat_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+        is_stream=False,
+    )
 
     return response
 
+
 def extract_vertexai_details(instance):
     """
     Extract VertexAI-specific details like location and model name.
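The hunks above are a pure re-wrap: `common_chat_logic` still records the same request, token, cost, and content attributes on the span. For orientation, here is a minimal sketch of that recording pattern written against the plain OpenTelemetry API; the literal attribute strings are assumptions standing in for openlit's `SemanticConvention` constants, and the function name is hypothetical.

```python
# Minimal sketch of the span-attribute pattern behind common_chat_logic.
# Attribute names are illustrative stand-ins for SemanticConvention values.
from opentelemetry import trace

tracer = trace.get_tracer("openlit-sketch")

def record_chat_span(request_model, input_tokens, output_tokens, cost, completion):
    with tracer.start_as_current_span(f"chat {request_model}") as span:
        span.set_attribute("gen_ai.request.model", request_model)
        span.set_attribute("gen_ai.usage.input_tokens", input_tokens)
        span.set_attribute("gen_ai.usage.output_tokens", output_tokens)
        # Total usage and cost, mirroring GEN_AI_CLIENT_TOKEN_USAGE and
        # GEN_AI_USAGE_COST in the diff above.
        span.set_attribute("gen_ai.client.token.usage", input_tokens + output_tokens)
        span.set_attribute("gen_ai.usage.cost", cost)
        span.set_attribute("gen_ai.completion", completion)

record_chat_span("gemini-1.5-pro", 42, 128, 0.0003, "Hello!")
```

Without an SDK configured this runs against the no-op tracer, which is enough to see the shape of the calls.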
openlit/instrumentation/vertexai/vertexai.py CHANGED

@@ -19,8 +19,17 @@ from openlit.semcov import SemanticConvention
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
 
-def send_message(version, environment, application_name, tracer,
-    pricing_info, capture_message_content, metrics, disable_metrics):
+
+def send_message(
+    version,
+    environment,
+    application_name,
+    tracer,
+    pricing_info,
+    capture_message_content,
+    metrics,
+    disable_metrics,
+):
     """
     Generates a telemetry wrapper for VertexAI messages to collect metrics.
     """
@@ -31,16 +40,16 @@ def send_message(version, environment, application_name, tracer,
         """
 
         def __init__(
-                self,
-                wrapped,
-                span,
-                span_name,
-                kwargs,
-                server_address,
-                server_port,
-                request_model,
-                args,
-            ):
+            self,
+            wrapped,
+            span,
+            span_name,
+            kwargs,
+            server_address,
+            server_port,
+            request_model,
+            args,
+        ):
             self.__wrapped__ = wrapped
             self._span = span
             self._span_name = span_name
@@ -88,7 +97,7 @@ def send_message(version, environment, application_name, tracer,
                         metrics=metrics,
                         capture_message_content=capture_message_content,
                         disable_metrics=disable_metrics,
-                        version=version
+                        version=version,
                     )
                 except Exception as e:
                     handle_exception(self._span, e)
@@ -108,7 +117,16 @@ def send_message(version, environment, application_name, tracer,
         awaited_wrapped = wrapped(*args, **kwargs)
         span = tracer.start_span(span_name, kind=SpanKind.CLIENT)
 
-        return TracedSyncStream(awaited_wrapped, span, span_name, kwargs, server_address, server_port, request_model, args)
+        return TracedSyncStream(
+            awaited_wrapped,
+            span,
+            span_name,
+            kwargs,
+            server_address,
+            server_port,
+            request_model,
+            args,
+        )
 
     else:
         with tracer.start_as_current_span(span_name, kind=SpanKind.CLIENT) as span:
@@ -130,7 +148,7 @@ def send_message(version, environment, application_name, tracer,
                     capture_message_content=capture_message_content,
                     disable_metrics=disable_metrics,
                     version=version,
-                    **kwargs
+                    **kwargs,
                 )
 
             except Exception as e:
openlit/instrumentation/vllm/__init__.py CHANGED

@@ -5,12 +5,11 @@ import importlib.metadata
 from opentelemetry.instrumentation.instrumentor import BaseInstrumentor
 from wrapt import wrap_function_wrapper
 
-from openlit.instrumentation.vllm.vllm import (
-    generate
-)
+from openlit.instrumentation.vllm.vllm import generate
 
 _instruments = ("vllm >= 0.5.4",)
 
+
 class VLLMInstrumentor(BaseInstrumentor):
     """
     An instrumentor for vLLM client library.
@@ -33,8 +32,16 @@ class VLLMInstrumentor(BaseInstrumentor):
         wrap_function_wrapper(
             "vllm.entrypoints.llm",
             "LLM.generate",
-            generate(version, environment, application_name, tracer,
-                pricing_info, capture_message_content, metrics, disable_metrics),
+            generate(
+                version,
+                environment,
+                application_name,
+                tracer,
+                pricing_info,
+                capture_message_content,
+                metrics,
+                disable_metrics,
+            ),
         )
 
     def _uninstrument(self, **kwargs):
openlit/instrumentation/vllm/utils.py CHANGED

@@ -1,6 +1,7 @@
 """
 vLLM OpenTelemetry instrumentation utility functions
 """
+
 import time
 
 from opentelemetry.trace import Status, StatusCode
@@ -13,17 +14,19 @@ from openlit.__helpers import (
 )
 from openlit.semcov import SemanticConvention
 
+
 def get_inference_config(args, kwargs):
     """
     Safely extract inference configuration from args or kwargs.
     """
 
-    if 'sampling_params' in kwargs:
-        return kwargs['sampling_params']
+    if "sampling_params" in kwargs:
+        return kwargs["sampling_params"]
     if len(args) > 1:
         return args[1]
     return None
 
+
 def format_content(prompts):
     """
     Process a list of prompts to extract content.
@@ -36,8 +39,18 @@ def format_content(prompts):
     else:
         return str(prompts)
 
-def common_chat_logic(scope, pricing_info, environment, application_name, metrics,
-    capture_message_content, disable_metrics, version, is_stream):
+
+def common_chat_logic(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content,
+    disable_metrics,
+    version,
+    is_stream,
+):
     """
     Process chat request and generate Telemetry
     """
@@ -60,37 +73,75 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
     cost = get_chat_model_cost(request_model, pricing_info, input_tokens, output_tokens)
 
     # Common Span Attributes
-    common_span_attributes(scope,
-        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_VLLM,
-        scope._server_address, scope._server_port, request_model, request_model,
-        environment, application_name, is_stream, scope._tbt, scope._ttft, version)
+    common_span_attributes(
+        scope,
+        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+        SemanticConvention.GEN_AI_SYSTEM_VLLM,
+        scope._server_address,
+        scope._server_port,
+        request_model,
+        request_model,
+        environment,
+        application_name,
+        is_stream,
+        scope._tbt,
+        scope._ttft,
+        version,
+    )
 
     # Span Attributes for Request parameters
     inference_config = get_inference_config(scope._args, scope._kwargs)
     if inference_config:
-        scope._span.set_attribute(
-            SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS,
-            getattr(inference_config, 'max_tokens', -1),
-        )
-        scope._span.set_attribute(
-            SemanticConvention.GEN_AI_REQUEST_TEMPERATURE,
-            getattr(inference_config, 'temperature', 1.0),
-        )
-        scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_P, getattr(inference_config, 'top_p', 1.0))
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS,
+            getattr(inference_config, "max_tokens", -1),
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES,
+            getattr(inference_config, "stop_sequences", []),
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_REQUEST_TEMPERATURE,
+            getattr(inference_config, "temperature", 1.0),
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_REQUEST_TOP_P,
+            getattr(inference_config, "top_p", 1.0),
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_REQUEST_TOP_K,
+            getattr(inference_config, "top_k", -1),
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY,
+            getattr(inference_config, "presence_penalty", 0.0),
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY,
+            getattr(inference_config, "frequency_penalty", 0.0),
+        )
 
     # Span Attributes for Response parameters
     scope._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE, "text")
 
     # Span Attributes for Cost and Tokens
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, input_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, output_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, input_tokens + output_tokens)
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, input_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, output_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, input_tokens + output_tokens
+    )
     scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
 
     # Span Attributes for Content
     if capture_message_content:
         scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_PROMPT, prompt)
-        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_COMPLETION, completion)
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_CONTENT_COMPLETION, completion
+        )
 
     # To be removed once the change to span_attributes (from span events) is complete
     scope._span.add_event(
@@ -110,14 +161,44 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
 
     # Metrics
     if not disable_metrics:
-        record_completion_metrics(metrics, SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_VLLM,
-            scope._server_address, scope._server_port, request_model, request_model, environment,
-            application_name, scope._start_time, scope._end_time, input_tokens, output_tokens,
-            cost, scope._tbt, scope._ttft)
-
-def process_chat_response(instance, response, request_model, pricing_info, server_port, server_address,
-    environment, application_name, metrics, start_time, span, args, kwargs,
-    capture_message_content=False, disable_metrics=False, version="1.0.0"):
+        record_completion_metrics(
+            metrics,
+            SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+            SemanticConvention.GEN_AI_SYSTEM_VLLM,
+            scope._server_address,
+            scope._server_port,
+            request_model,
+            request_model,
+            environment,
+            application_name,
+            scope._start_time,
+            scope._end_time,
+            input_tokens,
+            output_tokens,
+            cost,
+            scope._tbt,
+            scope._ttft,
+        )
+
+
+def process_chat_response(
+    instance,
+    response,
+    request_model,
+    pricing_info,
+    server_port,
+    server_address,
+    environment,
+    application_name,
+    metrics,
+    start_time,
+    span,
+    args,
+    kwargs,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="1.0.0",
+):
     """
     Process chat request and generate Telemetry
    """
@@ -137,7 +218,16 @@ def process_chat_response(instance, response, request_model, pricing_info, serve
     scope._args = args
     scope._kwargs = kwargs
 
-    common_chat_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version, is_stream=False)
+    common_chat_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+        is_stream=False,
+    )
 
     return response
openlit/instrumentation/vllm/vllm.py CHANGED

@@ -4,17 +4,21 @@ Module for monitoring vLLM API calls.
 
 import time
 from opentelemetry.trace import SpanKind
-from openlit.__helpers import (
-    handle_exception,
-    set_server_address_and_port
-)
-from openlit.instrumentation.vllm.utils import (
-    process_chat_response
-)
+from openlit.__helpers import handle_exception, set_server_address_and_port
+from openlit.instrumentation.vllm.utils import process_chat_response
 from openlit.semcov import SemanticConvention
 
-def generate(version, environment, application_name, tracer, pricing_info,
-    capture_message_content, metrics, disable_metrics):
+
+def generate(
+    version,
+    environment,
+    application_name,
+    tracer,
+    pricing_info,
+    capture_message_content,
+    metrics,
+    disable_metrics,
+):
     """
     Generates a telemetry wrapper for GenAI function call
     """
@@ -23,7 +27,9 @@ def generate(version, environment, application_name, tracer, pricing_info,
         """
         Wraps the GenAI function call.
         """
-        server_address, server_port = set_server_address_and_port(instance, "http://127.0.0.1", 443)
+        server_address, server_port = set_server_address_and_port(
+            instance, "http://127.0.0.1", 443
+        )
         request_model = instance.llm_engine.model_config.model or "facebook/opt-125m"
 
         span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
openlit/otel/events.py CHANGED

@@ -4,10 +4,17 @@ Setups up OpenTelemetry events emitter
 
 import os
 from opentelemetry import _events, _logs
-from opentelemetry.sdk.resources import SERVICE_NAME, TELEMETRY_SDK_NAME, DEPLOYMENT_ENVIRONMENT
+from opentelemetry.sdk.resources import (
+    SERVICE_NAME,
+    TELEMETRY_SDK_NAME,
+    DEPLOYMENT_ENVIRONMENT,
+)
 from opentelemetry.sdk.resources import Resource
 from opentelemetry.sdk._events import EventLoggerProvider
-from opentelemetry.sdk._logs.export import BatchLogRecordProcessor, SimpleLogRecordProcessor
+from opentelemetry.sdk._logs.export import (
+    BatchLogRecordProcessor,
+    SimpleLogRecordProcessor,
+)
 from opentelemetry.sdk._logs import LoggerProvider
 from opentelemetry.sdk._logs.export import ConsoleLogExporter
 
@@ -19,7 +26,15 @@ else:
 # Global flag to check if the events provider initialization is complete.
 EVENTS_SET = False
 
-def setup_events(application_name, environment, event_logger, otlp_endpoint, otlp_headers, disable_batch):
+
+def setup_events(
+    application_name,
+    environment,
+    event_logger,
+    otlp_endpoint,
+    otlp_headers,
+    disable_batch,
+):
     """Setup OpenTelemetry events with the given configuration.
 
     Args:
@@ -42,10 +57,12 @@ def setup_events(application_name, environment, event_logger, otlp_endpoint, otl
     try:
         if not EVENTS_SET:
             # Create resource with service and environment information
-            resource = Resource.create(attributes={
-                SERVICE_NAME: application_name,
-                DEPLOYMENT_ENVIRONMENT: environment,
-                TELEMETRY_SDK_NAME: "openlit"}
+            resource = Resource.create(
+                attributes={
+                    SERVICE_NAME: application_name,
+                    DEPLOYMENT_ENVIRONMENT: environment,
+                    TELEMETRY_SDK_NAME: "openlit",
+                }
             )
 
             # Initialize the LoggerProvider with the created resource.
@@ -57,7 +74,9 @@ def setup_events(application_name, environment, event_logger, otlp_endpoint, otl
 
         if otlp_headers is not None:
             if isinstance(otlp_headers, dict):
-                headers_str = ','.join(f"{key}={value}" for key, value in otlp_headers.items())
+                headers_str = ",".join(
+                    f"{key}={value}" for key, value in otlp_headers.items()
+                )
             else:
                 headers_str = otlp_headers
 
@@ -67,10 +86,16 @@ def setup_events(application_name, environment, event_logger, otlp_endpoint, otl
             if os.getenv("OTEL_EXPORTER_OTLP_ENDPOINT"):
                 event_exporter = OTLPLogExporter()
                 # pylint: disable=line-too-long
-                logger_provider.add_log_record_processor(SimpleLogRecordProcessor(event_exporter)) if disable_batch else logger_provider.add_log_record_processor(BatchLogRecordProcessor(event_exporter))
+                logger_provider.add_log_record_processor(
+                    SimpleLogRecordProcessor(event_exporter)
+                ) if disable_batch else logger_provider.add_log_record_processor(
+                    BatchLogRecordProcessor(event_exporter)
+                )
             else:
                 event_exporter = ConsoleLogExporter()
-                logger_provider.add_log_record_processor(SimpleLogRecordProcessor(event_exporter))
+                logger_provider.add_log_record_processor(
+                    SimpleLogRecordProcessor(event_exporter)
+                )
 
             _logs.set_logger_provider(logger_provider)
             event_provider = EventLoggerProvider()