openlit 1.34.10__py3-none-any.whl → 1.34.12__py3-none-any.whl
This diff compares publicly available package versions released to a supported registry. It is provided for informational purposes only and reflects the changes between the versions as they appear in their respective public registries.
- openlit/__helpers.py +26 -3
- openlit/instrumentation/ai21/__init__.py +10 -8
- openlit/instrumentation/ai21/ai21.py +15 -27
- openlit/instrumentation/ai21/async_ai21.py +15 -27
- openlit/instrumentation/ai21/utils.py +229 -212
- openlit/instrumentation/groq/__init__.py +7 -9
- openlit/instrumentation/groq/async_groq.py +50 -374
- openlit/instrumentation/groq/groq.py +49 -373
- openlit/instrumentation/groq/utils.py +199 -0
- openlit/instrumentation/ollama/async_ollama.py +3 -2
- openlit/instrumentation/ollama/ollama.py +3 -2
- openlit/instrumentation/ollama/utils.py +10 -6
- openlit/instrumentation/openai/__init__.py +3 -3
- openlit/instrumentation/premai/utils.py +3 -73
- openlit/instrumentation/reka/utils.py +3 -51
- {openlit-1.34.10.dist-info → openlit-1.34.12.dist-info}/METADATA +1 -1
- {openlit-1.34.10.dist-info → openlit-1.34.12.dist-info}/RECORD +19 -18
- {openlit-1.34.10.dist-info → openlit-1.34.12.dist-info}/LICENSE +0 -0
- {openlit-1.34.10.dist-info → openlit-1.34.12.dist-info}/WHEEL +0 -0
openlit/__helpers.py
CHANGED
@@ -346,12 +346,12 @@ def common_span_attributes(scope, gen_ai_operation, gen_ai_system, server_address
     scope._span.set_attribute(SemanticConvention.SERVER_ADDRESS, server_address)
     scope._span.set_attribute(SemanticConvention.SERVER_PORT, server_port)
     scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL, request_model)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
+    scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL, response_model)
     scope._span.set_attribute(DEPLOYMENT_ENVIRONMENT, environment)
     scope._span.set_attribute(SERVICE_NAME, application_name)
     scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM, is_stream)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TBT,
-    scope._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
+    scope._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TBT, tbt)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT, ttft)
     scope._span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION, version)

 def record_completion_metrics(metrics, gen_ai_operation, gen_ai_system, server_address, server_port,
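This hunk rewrites three set_attribute calls in common_span_attributes so the value arguments (response_model, tbt, ttft) are passed inline. For orientation, a minimal sketch of the plain OpenTelemetry pattern the helper builds on, assuming opentelemetry-api is installed; the string keys are illustrative stand-ins for the SemanticConvention constants:

from opentelemetry import trace

tracer = trace.get_tracer("demo")

with tracer.start_as_current_span("chat jamba-1.5-mini") as span:
    # Illustrative keys; openlit resolves these via SemanticConvention constants.
    span.set_attribute("gen_ai.response.model", "jamba-1.5-mini")
    span.set_attribute("gen_ai.server.tbt", 0.021)   # time between tokens, seconds
    span.set_attribute("gen_ai.server.ttft", 0.350)  # time to first token, seconds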
@@ -379,3 +379,26 @@ def record_completion_metrics(metrics, gen_ai_operation, gen_ai_system, server_a
     metrics["genai_completion_tokens"].add(output_tokens, attributes)
     metrics["genai_prompt_tokens"].add(input_tokens, attributes)
     metrics["genai_cost"].record(cost, attributes)
+
+def record_embedding_metrics(metrics, gen_ai_operation, gen_ai_system, server_address, server_port,
+    request_model, response_model, environment, application_name, start_time, end_time,
+    input_tokens, cost):
+    """
+    Record embedding-specific metrics for the operation.
+    """
+
+    attributes = create_metrics_attributes(
+        operation=gen_ai_operation,
+        system=gen_ai_system,
+        server_address=server_address,
+        server_port=server_port,
+        request_model=request_model,
+        response_model=response_model,
+        service_name=application_name,
+        deployment_environment=environment,
+    )
+    metrics["genai_client_usage_tokens"].record(input_tokens, attributes)
+    metrics["genai_client_operation_duration"].record(end_time - start_time, attributes)
+    metrics["genai_requests"].add(1, attributes)
+    metrics["genai_prompt_tokens"].add(input_tokens, attributes)
+    metrics["genai_cost"].record(cost, attributes)
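The new helper mirrors record_completion_metrics but records only input-token usage, since an embedding call produces no completion tokens. A hedged usage sketch, assuming openlit >= 1.34.12 is installed; the stub instruments and the model/application names are invented for illustration:

import time

from openlit.__helpers import record_embedding_metrics

class _StubInstrument:
    """Stand-in for an OpenTelemetry counter/histogram, just to make this runnable."""
    def __init__(self, name): self.name = name
    def add(self, value, attributes): print(f"{self.name} += {value}")
    def record(self, value, attributes): print(f"{self.name} -> {value}")

metrics = {name: _StubInstrument(name) for name in (
    "genai_client_usage_tokens", "genai_client_operation_duration",
    "genai_requests", "genai_prompt_tokens", "genai_cost",
)}

start = time.time()
# ... the embedding request itself would run here ...
record_embedding_metrics(
    metrics, "embedding", "ai21", "api.ai21.com", 443,
    "jamba-embed", "jamba-embed",     # request/response model (hypothetical names)
    "production", "demo-app",         # environment, application_name
    start, time.time(), 128, 0.0004,  # start/end time, input_tokens, cost
)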
openlit/instrumentation/ai21/__init__.py
CHANGED
@@ -1,4 +1,3 @@
-# pylint: disable=useless-return, bad-staticmethod-argument, disable=duplicate-code
 """Initializer of Auto Instrumentation of AI21 Functions"""

 from typing import Collection
@@ -33,34 +32,37 @@ class AI21Instrumentor(BaseInstrumentor):
         disable_metrics = kwargs.get("disable_metrics")
         version = importlib.metadata.version("ai21")

-        #
+        # Chat completions
         wrap_function_wrapper(
             "ai21.clients.studio.resources.chat.chat_completions",
             "ChatCompletions.create",
             chat(version, environment, application_name,
-
+                tracer, pricing_info, capture_message_content, metrics, disable_metrics),
         )
+
+        # RAG completions
         wrap_function_wrapper(
             "ai21.clients.studio.resources.studio_conversational_rag",
             "StudioConversationalRag.create",
             chat_rag(version, environment, application_name,
-
+                tracer, pricing_info, capture_message_content, metrics, disable_metrics),
         )

-        #Async
+        # Async chat completions
         wrap_function_wrapper(
             "ai21.clients.studio.resources.chat.async_chat_completions",
             "AsyncChatCompletions.create",
             async_chat(version, environment, application_name,
-
+                tracer, pricing_info, capture_message_content, metrics, disable_metrics),
         )
+
+        # Async RAG completions
         wrap_function_wrapper(
             "ai21.clients.studio.resources.studio_conversational_rag",
             "AsyncStudioConversationalRag.create",
             async_chat_rag(version, environment, application_name,
-
+                tracer, pricing_info, capture_message_content, metrics, disable_metrics),
         )

     def _uninstrument(self, **kwargs):
-        # Proper uninstrumentation logic to revert patched methods
         pass
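Each wrap_function_wrapper call above patches one AI21 client method in place via wrapt, and the chat()/chat_rag() factories return wrappers with the standard wrapt signature (wrapped, instance, args, kwargs). A minimal, self-contained sketch of the same mechanism against a harmless stand-in target (json.dumps rather than the AI21 client), not OpenLIT's actual wrapper:

import json
import time

from wrapt import wrap_function_wrapper

def timing_wrapper(wrapped, instance, args, kwargs):
    # wrapped is the original callable; instance is its bound object (or None).
    start = time.time()
    try:
        return wrapped(*args, **kwargs)
    finally:
        print(f"json.dumps took {time.time() - start:.6f}s")

wrap_function_wrapper("json", "dumps", timing_wrapper)  # same call shape as above
json.dumps({"hello": "world"})  # prints the timing line, then returns the JSON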
openlit/instrumentation/ai21/ai21.py
CHANGED
@@ -1,8 +1,7 @@
 """
-Module for monitoring AI21 calls.
+Module for monitoring AI21 API calls.
 """

-import logging
 import time
 from opentelemetry.trace import SpanKind
 from openlit.__helpers import (
@@ -15,14 +14,10 @@ from openlit.instrumentation.ai21.utils import (
     process_streaming_chat_response,
     process_chat_rag_response
 )
-
 from openlit.semcov import SemanticConvention

-
-
-
-def chat(version, environment, application_name,
-    tracer, pricing_info, capture_message_content, metrics, disable_metrics):
+def chat(version, environment, application_name, tracer, pricing_info,
+    capture_message_content, metrics, disable_metrics):
     """
     Generates a telemetry wrapper for GenAI function call
     """
@@ -45,14 +40,12 @@ def chat(version, environment, application_name,
             self.__wrapped__ = wrapped
             self._span = span
             self._span_name = span_name
-            # Placeholder for aggregating streaming response
             self._llmresponse = ""
             self._response_id = ""
             self._finish_reason = ""
+            self._tools = None
             self._input_tokens = 0
             self._output_tokens = 0
-            self._choices = []
-
             self._args = args
             self._kwargs = kwargs
             self._start_time = time.time()
@@ -83,9 +76,8 @@ def chat(version, environment, application_name,
                 process_chunk(self, chunk)
                 return chunk
             except StopIteration:
-                # Handling exception ensure observability without disrupting operation
                 try:
-                    with tracer.start_as_current_span(self._span_name, kind=
+                    with tracer.start_as_current_span(self._span_name, kind=SpanKind.CLIENT) as self._span:
                         process_streaming_chat_response(
                             self,
                             pricing_info=pricing_info,
@@ -96,34 +88,31 @@ def chat(version, environment, application_name,
                             disable_metrics=disable_metrics,
                             version=version
                         )
+
                 except Exception as e:
                     handle_exception(self._span, e)
-
+
                 raise

     def wrapper(wrapped, instance, args, kwargs):
         """
         Wraps the GenAI function call.
         """
-
         # Check if streaming is enabled for the API call
         streaming = kwargs.get("stream", False)
-
         server_address, server_port = set_server_address_and_port(instance, "api.ai21.com", 443)
         request_model = kwargs.get("model", "jamba-1.5-mini")

         span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"

-        # pylint: disable=no-else-return
         if streaming:
-            # Special handling for streaming response
+            # Special handling for streaming response
             awaited_wrapped = wrapped(*args, **kwargs)
             span = tracer.start_span(span_name, kind=SpanKind.CLIENT)
             return TracedSyncStream(awaited_wrapped, span, span_name, kwargs, server_address, server_port)
-
-        # Handling for non-streaming responses
         else:
-
+            # Handling for non-streaming responses
+            with tracer.start_as_current_span(span_name, kind=SpanKind.CLIENT) as span:
                 start_time = time.time()
                 response = wrapped(*args, **kwargs)
@@ -152,23 +141,22 @@ def chat(version, environment, application_name,

     return wrapper

-def chat_rag(version, environment, application_name,
-
+def chat_rag(version, environment, application_name, tracer, pricing_info,
+    capture_message_content, metrics, disable_metrics):
     """
-    Generates a telemetry wrapper for GenAI function call
+    Generates a telemetry wrapper for GenAI RAG function call
     """

     def wrapper(wrapped, instance, args, kwargs):
         """
-        Wraps the GenAI function call.
+        Wraps the GenAI RAG function call.
         """
-
         server_address, server_port = set_server_address_and_port(instance, "api.ai21.com", 443)
         request_model = kwargs.get("model", "jamba-1.5-mini")

         span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"

-        with tracer.start_as_current_span(span_name, kind=
+        with tracer.start_as_current_span(span_name, kind=SpanKind.CLIENT) as span:
             start_time = time.time()
             response = wrapped(*args, **kwargs)
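TracedSyncStream implements a common proxy-iterator pattern: delegate __next__ to the wrapped stream, feed each chunk through process_chunk, and only when the stream raises StopIteration re-enter the span to record the aggregated telemetry. A stripped-down sketch of that pattern, with invented callback names standing in for the real span logic:

class StreamProxy:
    """Minimal telemetry-collecting iterator proxy (a simplified sketch)."""

    def __init__(self, wrapped, on_chunk, on_done):
        self.__wrapped__ = wrapped
        self._on_chunk = on_chunk  # per-chunk hook, like process_chunk
        self._on_done = on_done    # runs once the stream is exhausted

    def __iter__(self):
        return self

    def __next__(self):
        try:
            chunk = self.__wrapped__.__next__()
        except StopIteration:
            self._on_done()  # the real class records span attributes/metrics here
            raise            # re-raise so callers see a normal end of stream
        self._on_chunk(chunk)
        return chunk

chunks = []
proxy = StreamProxy(iter(["Hel", "lo"]), chunks.append,
                    lambda: print("done:", "".join(chunks)))
assert list(proxy) == ["Hel", "lo"]  # prints "done: Hello" on exhaustion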
openlit/instrumentation/ai21/async_ai21.py
CHANGED
@@ -1,8 +1,7 @@
 """
-Module for monitoring AI21 calls.
+Module for monitoring AI21 API calls (async version).
 """

-import logging
 import time
 from opentelemetry.trace import SpanKind
 from openlit.__helpers import (
@@ -15,21 +14,17 @@ from openlit.instrumentation.ai21.utils import (
     process_streaming_chat_response,
     process_chat_rag_response
 )
-
 from openlit.semcov import SemanticConvention

-
-
-
-def async_chat(version, environment, application_name,
-    tracer, pricing_info, capture_message_content, metrics, disable_metrics):
+def async_chat(version, environment, application_name, tracer, pricing_info,
+    capture_message_content, metrics, disable_metrics):
     """
     Generates a telemetry wrapper for GenAI function call
     """

     class TracedAsyncStream:
         """
-        Wrapper for streaming responses to collect telemetry.
+        Wrapper for async streaming responses to collect telemetry.
         """

         def __init__(
@@ -45,14 +40,12 @@ def async_chat(version, environment, application_name,
             self.__wrapped__ = wrapped
             self._span = span
             self._span_name = span_name
-            # Placeholder for aggregating streaming response
            self._llmresponse = ""
             self._response_id = ""
             self._finish_reason = ""
+            self._tools = None
             self._input_tokens = 0
             self._output_tokens = 0
-            self._choices = []
-
             self._args = args
             self._kwargs = kwargs
             self._start_time = time.time()
@@ -83,9 +76,8 @@ def async_chat(version, environment, application_name,
                 process_chunk(self, chunk)
                 return chunk
             except StopAsyncIteration:
-                # Handling exception ensure observability without disrupting operation
                 try:
-                    with tracer.start_as_current_span(self._span_name, kind=
+                    with tracer.start_as_current_span(self._span_name, kind=SpanKind.CLIENT) as self._span:
                         process_streaming_chat_response(
                             self,
                             pricing_info=pricing_info,
@@ -96,6 +88,7 @@ def async_chat(version, environment, application_name,
                             disable_metrics=disable_metrics,
                             version=version
                         )
+
                 except Exception as e:
                     handle_exception(self._span, e)
@@ -105,25 +98,21 @@ def async_chat(version, environment, application_name,
         """
         Wraps the GenAI function call.
         """
-
         # Check if streaming is enabled for the API call
         streaming = kwargs.get("stream", False)
-
         server_address, server_port = set_server_address_and_port(instance, "api.ai21.com", 443)
         request_model = kwargs.get("model", "jamba-1.5-mini")

         span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"

-        # pylint: disable=no-else-return
         if streaming:
-            # Special handling for streaming response
+            # Special handling for streaming response
             awaited_wrapped = await wrapped(*args, **kwargs)
             span = tracer.start_span(span_name, kind=SpanKind.CLIENT)
             return TracedAsyncStream(awaited_wrapped, span, span_name, kwargs, server_address, server_port)
-
-        # Handling for non-streaming responses
         else:
-
+            # Handling for non-streaming responses
+            with tracer.start_as_current_span(span_name, kind=SpanKind.CLIENT) as span:
                 start_time = time.time()
                 response = await wrapped(*args, **kwargs)
@@ -152,23 +141,22 @@ def async_chat(version, environment, application_name,

     return wrapper

-def async_chat_rag(version, environment, application_name,
-
+def async_chat_rag(version, environment, application_name, tracer, pricing_info,
+    capture_message_content, metrics, disable_metrics):
     """
-    Generates a telemetry wrapper for GenAI function call
+    Generates a telemetry wrapper for GenAI RAG function call
     """

     async def wrapper(wrapped, instance, args, kwargs):
         """
-        Wraps the GenAI function call.
+        Wraps the GenAI RAG function call.
         """
-
         server_address, server_port = set_server_address_and_port(instance, "api.ai21.com", 443)
         request_model = kwargs.get("model", "jamba-1.5-mini")

         span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"

-        with tracer.start_as_current_span(span_name, kind=
+        with tracer.start_as_current_span(span_name, kind=SpanKind.CLIENT) as span:
             start_time = time.time()
             response = await wrapped(*args, **kwargs)
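async_ai21.py mirrors the sync module almost line for line; the structural difference is the async iterator protocol (__anext__ and StopAsyncIteration instead of __next__ and StopIteration) and awaiting the wrapped call. A compact sketch of just that boundary, again with invented names:

import asyncio

class AsyncStreamProxy:
    """Async counterpart of the sync proxy sketch above (simplified)."""

    def __init__(self, wrapped, on_chunk, on_done):
        self.__wrapped__ = wrapped
        self._on_chunk = on_chunk
        self._on_done = on_done

    def __aiter__(self):
        return self

    async def __anext__(self):
        try:
            chunk = await self.__wrapped__.__anext__()
        except StopAsyncIteration:
            self._on_done()  # span finalization happens here in the real class
            raise
        self._on_chunk(chunk)
        return chunk

async def main():
    async def fake_stream():
        for part in ("Hel", "lo"):
            yield part

    parts = []
    async for _ in AsyncStreamProxy(fake_stream(), parts.append, lambda: print("done")):
        pass
    print("".join(parts))  # -> Hello

asyncio.run(main())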