openlit 1.34.13__py3-none-any.whl → 1.34.15__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- openlit/instrumentation/litellm/__init__.py +7 -6
- openlit/instrumentation/litellm/async_litellm.py +89 -493
- openlit/instrumentation/litellm/litellm.py +87 -491
- openlit/instrumentation/litellm/utils.py +288 -0
- openlit/instrumentation/transformers/__init__.py +12 -5
- openlit/instrumentation/transformers/transformers.py +21 -28
- openlit/instrumentation/transformers/utils.py +126 -110
- {openlit-1.34.13.dist-info → openlit-1.34.15.dist-info}/METADATA +1 -1
- {openlit-1.34.13.dist-info → openlit-1.34.15.dist-info}/RECORD +11 -10
- {openlit-1.34.13.dist-info → openlit-1.34.15.dist-info}/LICENSE +0 -0
- {openlit-1.34.13.dist-info → openlit-1.34.15.dist-info}/WHEEL +0 -0
openlit/instrumentation/transformers/utils.py

@@ -3,19 +3,61 @@ HF Transformers OpenTelemetry instrumentation utility functions
 """
 import time
 
-from opentelemetry.sdk.resources import SERVICE_NAME, TELEMETRY_SDK_NAME, DEPLOYMENT_ENVIRONMENT
 from opentelemetry.trace import Status, StatusCode
 
 from openlit.__helpers import (
-    response_as_dict,
-    calculate_tbt,
     general_tokens,
     get_chat_model_cost,
-
-
+    common_span_attributes,
+    record_completion_metrics,
 )
 from openlit.semcov import SemanticConvention
 
+def format_content(content):
+    """
+    Format content to a consistent structure.
+    """
+    if isinstance(content, str):
+        return content
+    elif isinstance(content, list):
+        # Check if it's a list of chat messages (like in the test case)
+        if (len(content) > 0 and isinstance(content[0], dict) and
+                "role" in content[0] and "content" in content[0]):
+            # Handle chat message format like Groq
+            formatted_messages = []
+            for message in content:
+                role = message["role"]
+                msg_content = message["content"]
+
+                if isinstance(msg_content, list):
+                    content_str = ", ".join(
+                        f'{item["type"]}: {item["text"] if "text" in item else item.get("image_url", str(item))}'
+                        if isinstance(item, dict) and "type" in item
+                        else str(item)
+                        for item in msg_content
+                    )
+                    formatted_messages.append(f"{role}: {content_str}")
+                else:
+                    formatted_messages.append(f"{role}: {msg_content}")
+            return "\n".join(formatted_messages)
+        else:
+            # Handle other list formats (transformers responses)
+            formatted_content = []
+            for item in content:
+                if isinstance(item, str):
+                    formatted_content.append(item)
+                elif isinstance(item, dict):
+                    # Handle dict format for transformers
+                    if "generated_text" in item:
+                        formatted_content.append(str(item["generated_text"]))
+                    else:
+                        formatted_content.append(str(item))
+                else:
+                    formatted_content.append(str(item))
+            return " ".join(formatted_content)
+    else:
+        return str(content)
+
 def common_chat_logic(scope, pricing_info, environment, application_name, metrics,
     capture_message_content, disable_metrics, version, args, kwargs, is_stream):
 
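The new format_content helper normalizes every prompt shape the transformers instrumentation sees, chat-style message lists as well as raw pipeline outputs, into one string. A usage sketch (the import path follows this diff; the sample data is made up):

```python
from openlit.instrumentation.transformers.utils import format_content

# Chat-style message lists are flattened to "role: content" lines.
messages = [
    {"role": "user", "content": "What is OpenTelemetry?"},
    {"role": "assistant", "content": [{"type": "text", "text": "A telemetry framework."}]},
]
print(format_content(messages))
# user: What is OpenTelemetry?
# assistant: text: A telemetry framework.

# Transformers-style response lists are joined on generated_text.
print(format_content([{"generated_text": "Hello"}, {"generated_text": "world"}]))
# Hello world
```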
@@ -24,56 +66,42 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
     """
 
     scope._end_time = time.time()
-    if len(scope._timestamps) > 1:
-        scope._tbt = calculate_tbt(scope._timestamps)
-
     forward_params = scope._instance._forward_params
     request_model = scope._instance.model.config.name_or_path
 
     input_tokens = general_tokens(scope._prompt)
-    output_tokens = general_tokens(scope.
+    output_tokens = general_tokens(scope._completion)
 
     cost = get_chat_model_cost(request_model, pricing_info, input_tokens, output_tokens)
 
-    #
-    scope
-
-
-
-
-
-
-
-        (SemanticConvention.GEN_AI_REQUEST_TOP_K, "top_k")
-
-        (SemanticConvention.
-
-
-
-
-        value = forward_params.get(key)
-        if value is not None:
-            scope._span.set_attribute(attribute, value)
-
-    scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL, request_model)
+    # Common Span Attributes
+    common_span_attributes(scope,
+        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_HUGGING_FACE,
+        scope._server_address, scope._server_port, request_model, request_model,
+        environment, application_name, is_stream, scope._tbt, scope._ttft, version)
+
+    # Set request parameters from forward_params
+    if forward_params.get("temperature") is not None:
+        scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, forward_params["temperature"])
+    if forward_params.get("top_k") is not None:
+        scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_K, forward_params["top_k"])
+    if forward_params.get("top_p") is not None:
+        scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_P, forward_params["top_p"])
+    if forward_params.get("max_length") is not None:
+        scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, forward_params["max_length"])
+
+    # Set token usage and cost attributes
     scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, input_tokens)
     scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, output_tokens)
-    scope._span.set_attribute(SemanticConvention.SERVER_ADDRESS, scope._server_address)
-    scope._span.set_attribute(DEPLOYMENT_ENVIRONMENT, environment)
-    scope._span.set_attribute(SERVICE_NAME, application_name)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM, is_stream)
     scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, input_tokens + output_tokens)
     scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TBT, scope._tbt)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT, scope._ttft)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION, version)
 
-    #
+    # Span Attributes for Content
    if capture_message_content:
         scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_PROMPT, scope._prompt)
-        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope.
+        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._completion)
 
+        # To be removed once the change to span_attributes (from span events) is complete
         scope._span.add_event(
             name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
             attributes={
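The rewrite above replaces the old attribute-mapping loop with explicit per-parameter guards: a transformers pipeline's _forward_params only holds the generation kwargs the caller actually set, and OpenTelemetry span attribute values must not be None. A standalone sketch of the same pattern (the dict stands in for _forward_params; the gen_ai.* strings follow the OpenTelemetry GenAI semantic conventions that SemanticConvention mirrors):

```python
# Stand-in for a transformers pipeline's _forward_params.
forward_params = {"temperature": 0.7, "top_k": None, "max_length": 64}

span_attributes = {}
if forward_params.get("temperature") is not None:
    span_attributes["gen_ai.request.temperature"] = forward_params["temperature"]
if forward_params.get("top_k") is not None:
    span_attributes["gen_ai.request.top_k"] = forward_params["top_k"]
if forward_params.get("max_length") is not None:
    # transformers' max_length maps onto the max-tokens attribute
    span_attributes["gen_ai.request.max_tokens"] = forward_params["max_length"]

print(span_attributes)
# {'gen_ai.request.temperature': 0.7, 'gen_ai.request.max_tokens': 64}
```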
@@ -83,32 +111,18 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
         scope._span.add_event(
             name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
             attributes={
-                SemanticConvention.GEN_AI_CONTENT_COMPLETION: scope.
+                SemanticConvention.GEN_AI_CONTENT_COMPLETION: scope._completion,
             },
         )
 
     scope._span.set_status(Status(StatusCode.OK))
 
+    # Record metrics using the standardized helper function
     if not disable_metrics:
-
-
-
-
-            system=SemanticConvention.GEN_AI_SYSTEM_HUGGING_FACE,
-            request_model=request_model,
-            server_address=scope._server_address,
-            server_port=scope._server_port,
-            response_model=request_model,
-        )
-
-        metrics["genai_client_usage_tokens"].record(input_tokens + output_tokens, metrics_attributes)
-        metrics["genai_client_operation_duration"].record(scope._end_time - scope._start_time, metrics_attributes)
-        metrics["genai_server_tbt"].record(scope._tbt, metrics_attributes)
-        metrics["genai_server_ttft"].record(scope._ttft, metrics_attributes)
-        metrics["genai_requests"].add(1, metrics_attributes)
-        metrics["genai_completion_tokens"].add(output_tokens, metrics_attributes)
-        metrics["genai_prompt_tokens"].add(input_tokens, metrics_attributes)
-        metrics["genai_cost"].record(cost, metrics_attributes)
+        record_completion_metrics(metrics, SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+            SemanticConvention.GEN_AI_SYSTEM_HUGGING_FACE, scope._server_address, scope._server_port,
+            request_model, request_model, environment, application_name, scope._start_time, scope._end_time,
+            cost, input_tokens, output_tokens, scope._tbt, scope._ttft)
 
 def process_chat_response(instance, response, request_model, pricing_info, server_port, server_address,
     environment, application_name, metrics, start_time,
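record_completion_metrics collapses the eight hand-rolled instrument calls removed above into one shared helper in openlit.__helpers. A hypothetical sketch of what such a helper does, inferred from the removed code (the parameter order matches the new call site; the attribute-building step is an assumption, not openlit's actual implementation):

```python
def record_completion_metrics(metrics, operation, system, server_address, server_port,
        request_model, response_model, environment, application_name,
        start_time, end_time, cost, input_tokens, output_tokens, tbt, ttft):
    # Assumed shape of the shared metric attributes.
    attrs = {
        "gen_ai.operation.name": operation,
        "gen_ai.system": system,
        "gen_ai.request.model": request_model,
        "gen_ai.response.model": response_model,
        "server.address": server_address,
        "server.port": server_port,
    }
    # Instrument names taken from the calls this refactor removes.
    metrics["genai_requests"].add(1, attrs)
    metrics["genai_prompt_tokens"].add(input_tokens, attrs)
    metrics["genai_completion_tokens"].add(output_tokens, attrs)
    metrics["genai_client_usage_tokens"].record(input_tokens + output_tokens, attrs)
    metrics["genai_client_operation_duration"].record(end_time - start_time, attrs)
    metrics["genai_server_tbt"].record(tbt, attrs)
    metrics["genai_server_ttft"].record(ttft, attrs)
    metrics["genai_cost"].record(cost, attrs)
```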
@@ -117,67 +131,69 @@ def process_chat_response(instance, response, request_model, pricing_info, serve
     Process chat request and generate Telemetry
     """
 
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-    if self._args and len(self._args) > 0:
-        self._prompt = args[0]
+    scope = type("GenericScope", (), {})()
+    scope._instance = instance
+    scope._start_time = start_time
+    scope._end_time = time.time()
+    scope._span = span
+    scope._server_address = server_address
+    scope._server_port = server_port
+    scope._kwargs = kwargs
+    scope._args = args
+
+    # Extract prompt from args or kwargs
+    if args and len(args) > 0:
+        scope._prompt = args[0]
     else:
-
+        scope._prompt = (
             kwargs.get("text_inputs") or
             (kwargs.get("image") and kwargs.get("question") and
-
+                ("image: " + kwargs.get("image") + " question:" + kwargs.get("question"))) or
             kwargs.get("fallback") or
             ""
         )
-
-
-
-
-
-
-
-
-
+    scope._prompt = format_content(scope._prompt)
+
+    # Process response based on task type
+    task = kwargs.get("task", "text-generation")
+
+    if task == "text-generation":
+        # Handle text generation responses
+        if isinstance(response, list) and len(response) > 0:
+            first_entry = response[0]
+            if isinstance(first_entry, dict):
+                if isinstance(first_entry.get("generated_text"), list):
+                    # Handle nested list format
+                    last_element = first_entry.get("generated_text")[-1]
+                    scope._completion = last_element.get("content", str(last_element))
+                else:
+                    # Handle standard format
+                    scope._completion = first_entry.get("generated_text", "")
+            else:
+                scope._completion = str(first_entry)
         else:
-
-            if isinstance(entry, dict):
-                return entry.get("generated_text")
-            if isinstance(entry, list):
-                return " ".join(
-                    extract_text(sub_entry) for sub_entry in entry if isinstance(sub_entry, dict)
-                )
-            return ""
-
-        # Process and collect all generated texts
-        self._llmresponse = [
-            extract_text(entry) for entry in response_dict
-        ]
+            scope._completion = ""
 
-
-
+    elif task == "automatic-speech-recognition":
+        scope._completion = response.get("text", "") if isinstance(response, dict) else ""
 
-    elif
-
+    elif task == "image-classification":
+        scope._completion = str(response[0]) if isinstance(response, list) and len(response) > 0 else ""
 
-    elif
-
+    elif task == "visual-question-answering":
+        if isinstance(response, list) and len(response) > 0 and isinstance(response[0], dict):
+            scope._completion = response[0].get("answer", "")
+        else:
+            scope._completion = ""
+    else:
+        # Default handling for other tasks
+        scope._completion = format_content(response)
 
-
-
+    # Initialize timing attributes
+    scope._tbt = 0
+    scope._ttft = scope._end_time - scope._start_time
 
-    common_chat_logic(
-
+    common_chat_logic(scope, pricing_info, environment, application_name, metrics,
+        capture_message_content, disable_metrics, version, args, kwargs, is_stream=False)
 
     return response
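The type("GenericScope", (), {})() idiom above creates a throwaway attribute bag that carries request state from process_chat_response into common_chat_logic. A standalone illustration of why it works:

```python
# type() with three arguments builds a class on the fly; instances of it have
# a __dict__, so arbitrary attributes can be attached after creation.
scope = type("GenericScope", (), {})()
scope._prompt = "Hello"
scope._completion = "Hi there"
print(scope._prompt, scope._completion)  # Hello Hi there

# A bare object() would not work here, since it has no instance __dict__:
# object()._prompt = "Hello"  # AttributeError
```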
{openlit-1.34.13.dist-info → openlit-1.34.15.dist-info}/METADATA

@@ -1,6 +1,6 @@
 Metadata-Version: 2.3
 Name: openlit
-Version: 1.34.13
+Version: 1.34.15
 Summary: OpenTelemetry-native Auto instrumentation library for monitoring LLM Applications and GPUs, facilitating the integration of observability into your GenAI-driven projects
 License: Apache-2.0
 Keywords: OpenTelemetry,otel,otlp,llm,tracing,openai,anthropic,claude,cohere,llm monitoring,observability,monitoring,gpt,Generative AI,chatGPT,gpu
{openlit-1.34.13.dist-info → openlit-1.34.15.dist-info}/RECORD

@@ -80,9 +80,10 @@ openlit/instrumentation/langchain/async_langchain.py,sha256=rdk3INGcsxsfzZcoJo0y
 openlit/instrumentation/langchain/langchain.py,sha256=zgfzfOIDsaRoVgWl1T4XX2CLO7ttGOD15TagZtYQ-vE,17012
 openlit/instrumentation/letta/__init__.py,sha256=K8PtRKxuueyqEYE3LzxWJ74IieNKSI6dmk9sNRd8Mt0,3031
 openlit/instrumentation/letta/letta.py,sha256=SCIpJ4tdB1l1BmeQx4raaTS4MQO5X15pLvS4PepEKBE,8481
-openlit/instrumentation/litellm/__init__.py,sha256=
-openlit/instrumentation/litellm/async_litellm.py,sha256=
-openlit/instrumentation/litellm/litellm.py,sha256=
+openlit/instrumentation/litellm/__init__.py,sha256=D47yfDLLEKpkaRAy7_Yif70kj88AGqLQYZAABpTN4sE,2284
+openlit/instrumentation/litellm/async_litellm.py,sha256=6cL_hv9t4tuXkcKZvpTdnb0wGTs54lSwGWCtdYZvyXg,6768
+openlit/instrumentation/litellm/litellm.py,sha256=xLna3I_jcywTtIs1tBjHAQKyKjNM07T8GHX9pIqZcQ0,6664
+openlit/instrumentation/litellm/utils.py,sha256=VMSnYkKn9yZtOphIh2ENNuqJtGjz1fXEYUKi5JGHC7A,13195
 openlit/instrumentation/llamaindex/__init__.py,sha256=2pmd9BKw3ab0OJ4yuJEg0-Jkn_haDbXvbUm5r2-rOCU,2007
 openlit/instrumentation/llamaindex/llamaindex.py,sha256=mdT2TvEWD0D9cEkFjXMeTculNoMWkuJ4mj7QWFnvcqY,4085
 openlit/instrumentation/mem0/__init__.py,sha256=IadP3bKgz2HCbnrh9S7AW24uDauGkzsIWeOQaGkOCc4,2447
@@ -125,9 +126,9 @@ openlit/instrumentation/together/__init__.py,sha256=0UmUqQtppyK3oopb4lTjX2LITgVC
 openlit/instrumentation/together/async_together.py,sha256=0-h5fKw6rIwN_fvWVpGuvVqizIuM9xFCzz8Z4oGgOj0,6822
 openlit/instrumentation/together/together.py,sha256=nY6mzHmHgoMbbnB_9eL0EBQjP0ltJVdkQj4pbamHAj0,6723
 openlit/instrumentation/together/utils.py,sha256=n7r_pM_sqFnJEAkL7OhPydr0Uct0A74vXdcYELdbeW0,14368
-openlit/instrumentation/transformers/__init__.py,sha256=
-openlit/instrumentation/transformers/transformers.py,sha256=
-openlit/instrumentation/transformers/utils.py,sha256=
+openlit/instrumentation/transformers/__init__.py,sha256=hXq0WUZNl6Sz0Ihk29kA9i8Q1j0e1URFb7v7etnQpxI,1511
+openlit/instrumentation/transformers/transformers.py,sha256=MHnHVo_6NP0gSIqxen6qQpCrZ0fs8Ec80EdZumMpVNo,1797
+openlit/instrumentation/transformers/utils.py,sha256=MMy_SyRyDI4X-0mqbBwStac0xabmw0ZRvv_VWLA_Nkg,8426
 openlit/instrumentation/vertexai/__init__.py,sha256=mT28WCBvQfRCkAWGL6bd0EjEPHvMjaNcz6T3jsLZh8k,3745
 openlit/instrumentation/vertexai/async_vertexai.py,sha256=-kpg-eiL76O5_XopUPghCYwJHf0Nrxi00_Z5tCwq6zM,23086
 openlit/instrumentation/vertexai/vertexai.py,sha256=5NB090aWlm9DnlccNNLRO6A97P_RN-JnHb5JS01tYyw,23000
@@ -138,7 +139,7 @@ openlit/otel/events.py,sha256=VrMjTpvnLtYRBHCiFwJojTQqqNpRCxoD4yJYeQrtPsk,3560
 openlit/otel/metrics.py,sha256=GM2PDloBGRhBTkHHkYaqmOwIAQkY124ZhW4sEqW1Fgk,7086
 openlit/otel/tracing.py,sha256=tjV2bEbEDPUB1Z46gE-UsJsb04sRdFrfbhIDkxViZc0,3103
 openlit/semcov/__init__.py,sha256=ptyo37PY-FHDx_PShEvbdns71cD4YvvXw15bCRXKCKM,13461
-openlit-1.34.13.dist-info/LICENSE,sha256=
-openlit-1.34.13.dist-info/METADATA,sha256=
-openlit-1.34.13.dist-info/WHEEL,sha256=
-openlit-1.34.13.dist-info/RECORD,,
+openlit-1.34.15.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
+openlit-1.34.15.dist-info/METADATA,sha256=ySa6XC3OrkzTkTgO5r3UV-PCuefnpG6yoAzL2DvZ9aQ,23470
+openlit-1.34.15.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
+openlit-1.34.15.dist-info/RECORD,,
{openlit-1.34.13.dist-info → openlit-1.34.15.dist-info}/LICENSE: File without changes
{openlit-1.34.13.dist-info → openlit-1.34.15.dist-info}/WHEEL: File without changes
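For reference, each RECORD entry above has the form path,sha256=<digest>,<size>, where the digest is the URL-safe base64-encoded SHA-256 of the file with trailing padding stripped, per the wheel spec. A small sketch for checking an entry against an unpacked wheel (record_hash is our name, not part of openlit):

```python
import base64
import hashlib

def record_hash(path):
    """Compute a RECORD-style digest for one file of an unpacked wheel."""
    digest = hashlib.sha256(open(path, "rb").read()).digest()
    return "sha256=" + base64.urlsafe_b64encode(digest).rstrip(b"=").decode()

# For the 1.34.15 wheel, this should reproduce the entry above:
# record_hash("openlit/semcov/__init__.py")
# -> "sha256=ptyo37PY-FHDx_PShEvbdns71cD4YvvXw15bCRXKCKM"
```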