openlit 1.33.8__py3-none-any.whl → 1.33.9__py3-none-any.whl
This diff shows the changes between two publicly released versions of the package, as they appear in their respective public registries. It is provided for informational purposes only.
- openlit/__helpers.py +83 -0
- openlit/__init__.py +1 -1
- openlit/instrumentation/ag2/ag2.py +2 -2
- openlit/instrumentation/ai21/__init__.py +4 -4
- openlit/instrumentation/ai21/ai21.py +370 -319
- openlit/instrumentation/ai21/async_ai21.py +371 -319
- openlit/instrumentation/anthropic/__init__.py +4 -4
- openlit/instrumentation/anthropic/anthropic.py +321 -189
- openlit/instrumentation/anthropic/async_anthropic.py +323 -190
- openlit/instrumentation/assemblyai/__init__.py +1 -1
- openlit/instrumentation/assemblyai/assemblyai.py +59 -43
- openlit/instrumentation/astra/astra.py +4 -4
- openlit/instrumentation/astra/async_astra.py +4 -4
- openlit/instrumentation/azure_ai_inference/__init__.py +4 -4
- openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +406 -252
- openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +406 -252
- openlit/instrumentation/bedrock/__init__.py +1 -1
- openlit/instrumentation/bedrock/bedrock.py +115 -58
- openlit/instrumentation/chroma/chroma.py +4 -4
- openlit/instrumentation/cohere/__init__.py +33 -10
- openlit/instrumentation/cohere/async_cohere.py +610 -0
- openlit/instrumentation/cohere/cohere.py +410 -219
- openlit/instrumentation/controlflow/controlflow.py +2 -2
- openlit/instrumentation/crawl4ai/async_crawl4ai.py +2 -2
- openlit/instrumentation/crawl4ai/crawl4ai.py +2 -2
- openlit/instrumentation/crewai/crewai.py +2 -2
- openlit/instrumentation/dynamiq/dynamiq.py +2 -2
- openlit/instrumentation/elevenlabs/async_elevenlabs.py +73 -47
- openlit/instrumentation/elevenlabs/elevenlabs.py +73 -52
- openlit/instrumentation/embedchain/embedchain.py +4 -4
- openlit/instrumentation/firecrawl/firecrawl.py +2 -2
- openlit/instrumentation/google_ai_studio/__init__.py +9 -9
- openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +183 -219
- openlit/instrumentation/google_ai_studio/google_ai_studio.py +183 -220
- openlit/instrumentation/gpt4all/gpt4all.py +17 -17
- openlit/instrumentation/groq/async_groq.py +14 -14
- openlit/instrumentation/groq/groq.py +14 -14
- openlit/instrumentation/haystack/haystack.py +2 -2
- openlit/instrumentation/julep/async_julep.py +2 -2
- openlit/instrumentation/julep/julep.py +2 -2
- openlit/instrumentation/langchain/langchain.py +36 -31
- openlit/instrumentation/letta/letta.py +6 -6
- openlit/instrumentation/litellm/async_litellm.py +20 -20
- openlit/instrumentation/litellm/litellm.py +20 -20
- openlit/instrumentation/llamaindex/llamaindex.py +2 -2
- openlit/instrumentation/mem0/mem0.py +2 -2
- openlit/instrumentation/milvus/milvus.py +4 -4
- openlit/instrumentation/mistral/async_mistral.py +18 -18
- openlit/instrumentation/mistral/mistral.py +18 -18
- openlit/instrumentation/multion/async_multion.py +2 -2
- openlit/instrumentation/multion/multion.py +2 -2
- openlit/instrumentation/ollama/async_ollama.py +29 -29
- openlit/instrumentation/ollama/ollama.py +29 -29
- openlit/instrumentation/openai/__init__.py +11 -230
- openlit/instrumentation/openai/async_openai.py +434 -409
- openlit/instrumentation/openai/openai.py +415 -393
- openlit/instrumentation/phidata/phidata.py +2 -2
- openlit/instrumentation/pinecone/pinecone.py +4 -4
- openlit/instrumentation/premai/premai.py +20 -20
- openlit/instrumentation/qdrant/async_qdrant.py +4 -4
- openlit/instrumentation/qdrant/qdrant.py +4 -4
- openlit/instrumentation/reka/async_reka.py +6 -6
- openlit/instrumentation/reka/reka.py +6 -6
- openlit/instrumentation/together/async_together.py +18 -18
- openlit/instrumentation/together/together.py +18 -18
- openlit/instrumentation/transformers/transformers.py +6 -6
- openlit/instrumentation/vertexai/async_vertexai.py +53 -53
- openlit/instrumentation/vertexai/vertexai.py +53 -53
- openlit/instrumentation/vllm/vllm.py +6 -6
- openlit/otel/metrics.py +98 -7
- openlit/semcov/__init__.py +113 -80
- {openlit-1.33.8.dist-info → openlit-1.33.9.dist-info}/METADATA +1 -1
- openlit-1.33.9.dist-info/RECORD +121 -0
- {openlit-1.33.8.dist-info → openlit-1.33.9.dist-info}/WHEEL +1 -1
- openlit/instrumentation/openai/async_azure_openai.py +0 -900
- openlit/instrumentation/openai/azure_openai.py +0 -898
- openlit-1.33.8.dist-info/RECORD +0 -122
- {openlit-1.33.8.dist-info → openlit-1.33.9.dist-info}/LICENSE +0 -0
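
The hunks reproduced below come from the Google AI Studio, GPT4All, and Groq instrumentation modules; the same rename of openlit's span-attribute constants to the OTel GenAI semantic-convention names recurs across nearly all of the instrumentation files listed above. A minimal before/after sketch (the attribute names are taken verbatim from the hunks below; span is assumed to be an active OpenTelemetry span):

    # 1.33.8: openlit-specific attribute names
    span.set_attribute(SemanticConvetion.GEN_AI_TYPE,
                       SemanticConvetion.GEN_AI_TYPE_CHAT)
    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_PROMPT_TOKENS, prompt_tokens)
    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COMPLETION_TOKENS, completion_tokens)

    # 1.33.9: OTel GenAI semantic-convention names
    span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
                       SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS, prompt_tokens)
    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS, completion_tokens)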
@@ -1,21 +1,24 @@
-# pylint: disable=duplicate-code, broad-exception-caught, too-many-statements, unused-argument, possibly-used-before-assignment, protected-access
 """
 Module for monitoring Google AI Studio API calls.
 """
 
 import logging
+import time
 from opentelemetry.trace import SpanKind, Status, StatusCode
-from opentelemetry.sdk.resources import TELEMETRY_SDK_NAME
+from opentelemetry.sdk.resources import SERVICE_NAME, TELEMETRY_SDK_NAME, DEPLOYMENT_ENVIRONMENT
 from openlit.__helpers import (
-    handle_exception,
     get_chat_model_cost,
+    handle_exception,
+    response_as_dict,
+    create_metrics_attributes,
+    set_server_address_and_port
 )
 from openlit.semcov import SemanticConvetion
 
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
 
-def generate(gen_ai_endpoint, version, environment, application_name,
+def generate(version, environment, application_name,
              tracer, pricing_info, trace_content, metrics, disable_metrics):
     """
     Generates a telemetry wrapper for chat to collect metrics.
@@ -35,230 +38,190 @@ def generate(gen_ai_endpoint, version, environment, application_name,
 
     def wrapper(wrapped, instance, args, kwargs):
         """
-        Wraps the 'chat' API call to add telemetry.
-
+        Wraps the 'chat.completions' API call to add telemetry.
+
         This collects metrics such as execution time, cost, and token usage, and handles errors
         gracefully, adding details to the trace for observability.
 
         Args:
-            wrapped: The original 'chat' method to be wrapped.
+            wrapped: The original 'chat.completions' method to be wrapped.
            instance: The instance of the class where the original method is defined.
-            args: Positional arguments for the 'chat' method.
-            kwargs: Keyword arguments for the 'chat' method.
+            args: Positional arguments for the 'chat.completions' method.
+            kwargs: Keyword arguments for the 'chat.completions' method.
 
         Returns:
-            The response from the original 'chat' method.
+            The response from the original 'chat.completions' method.
         """
[… 54 deleted lines (old 52-105) not captured in this view …]
-                        model)
-                span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
-                        True)
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_PROMPT_TOKENS,
-                        input_tokens)
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COMPLETION_TOKENS,
+
+        server_address, server_port = set_server_address_and_port(instance, "generativelanguage.googleapis.com", 443)
+        request_model = kwargs.get("model", "gemini-2.0-flash")
+
+        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+
+        with tracer.start_as_current_span(span_name, kind=SpanKind.CLIENT) as span:
+            start_time = time.time()
+            response = wrapped(*args, **kwargs)
+            end_time = time.time()
+
+            response_dict = response_as_dict(response)
+
+            try:
+                # Format 'messages' into a single string
+                message_prompt = kwargs.get("contents", [])
+                formatted_messages = []
+
+                for content in message_prompt:
+                    role = content.role
+                    parts = content.parts
+                    content_str = []
+
+                    for part in parts:
+                        # Collect relevant fields and handle each type of data that Part could contain
+                        if part.text:
+                            content_str.append(f"text: {part.text}")
+                        if part.video_metadata:
+                            content_str.append(f"video_metadata: {part.video_metadata}")
+                        if part.thought:
+                            content_str.append(f"thought: {part.thought}")
+                        if part.code_execution_result:
+                            content_str.append(f"code_execution_result: {part.code_execution_result}")
+                        if part.executable_code:
+                            content_str.append(f"executable_code: {part.executable_code}")
+                        if part.file_data:
+                            content_str.append(f"file_data: {part.file_data}")
+                        if part.function_call:
+                            content_str.append(f"function_call: {part.function_call}")
+                        if part.function_response:
+                            content_str.append(f"function_response: {part.function_response}")
+                        if part.inline_data:
+                            content_str.append(f"inline_data: {part.inline_data}")
+
+                    formatted_messages.append(f"{role}: {', '.join(content_str)}")
+
+                prompt = "\n".join(formatted_messages)
+
+                input_tokens = response_dict.get('usage_metadata').get('prompt_token_count')
+                output_tokens = response_dict.get('usage_metadata').get('candidates_token_count')
+
+                # Calculate cost of the operation
+                cost = get_chat_model_cost(request_model,
+                                           pricing_info, input_tokens,
                                            output_tokens)
[… 105 deleted lines (old 113-217) not captured in this view …]
-                        cost
[… 11 deleted lines (old 219-229) not captured in this view …]
-                span.set_status(Status(StatusCode.OK))
-
-                if disable_metrics is False:
-                    attributes = {
-                        TELEMETRY_SDK_NAME:
-                            "openlit",
-                        SemanticConvetion.GEN_AI_APPLICATION_NAME:
-                            application_name,
-                        SemanticConvetion.GEN_AI_SYSTEM:
-                            SemanticConvetion.GEN_AI_SYSTEM_GOOGLE_AI_STUDIO,
-                        SemanticConvetion.GEN_AI_ENVIRONMENT:
-                            environment,
-                        SemanticConvetion.GEN_AI_TYPE:
-                            SemanticConvetion.GEN_AI_TYPE_CHAT,
-                        SemanticConvetion.GEN_AI_REQUEST_MODEL:
-                            model
-                    }
-
-                    metrics["genai_requests"].add(1, attributes)
-                    metrics["genai_total_tokens"].add(total_tokens, attributes)
-                    metrics["genai_completion_tokens"].add(completion_tokens, attributes)
-                    metrics["genai_prompt_tokens"].add(prompt_tokens, attributes)
-                    metrics["genai_cost"].record(cost, attributes)
-
-                # Return original response
-                return response
-
-            except Exception as e:
-                handle_exception(span, e)
-                logger.error("Error in trace creation: %s", e)
-
-                # Return original response
-                return response
+
+                # Set base span attribues (OTel Semconv)
+                span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
+                span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
+                                   SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
+                span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
+                                   SemanticConvetion.GEN_AI_SYSTEM_GEMINI)
+                span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+                                   request_model)
+                span.set_attribute(SemanticConvetion.SERVER_PORT,
+                                   server_port)
+
+                inference_config = kwargs.get('config', {})
+
+                # List of attributes and their config keys
+                attributes = [
+                    (SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
+                    (SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS, 'max_tokens'),
+                    (SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
+                    (SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
+                    (SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
+                    (SemanticConvetion.GEN_AI_REQUEST_TOP_P, 'top_p'),
+                    (SemanticConvetion.GEN_AI_REQUEST_TOP_K, 'top_k'),
+                ]
+
+                # Set each attribute if the corresponding value exists and is not None
+                for attribute, key in attributes:
+                    # Use getattr to get the attribute value from the object
+                    value = getattr(inference_config, key, None)
+                    if value is not None:
+                        span.set_attribute(attribute, value)
+
+                span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                                   response_dict.get('model_version'))
+                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                                   input_tokens)
+                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+                                   output_tokens)
+                span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                                   server_address)
+                span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_FINISH_REASON,
+                                   [str(response_dict.get('candidates')[0].get('finish_reason'))])
+
+                # Set base span attribues (Extras)
+                span.set_attribute(DEPLOYMENT_ENVIRONMENT,
+                                   environment)
+                span.set_attribute(SERVICE_NAME,
+                                   application_name)
+                span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+                                   False)
+                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+                                   input_tokens + output_tokens)
+                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                                   cost)
+                span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+                                   end_time - start_time)
+                span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                                   version)
+                if trace_content:
+                    span.add_event(
+                        name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                        attributes={
+                            SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                        },
+                    )
+                    span.add_event(
+                        name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                        attributes={
+                            SemanticConvetion.GEN_AI_CONTENT_COMPLETION: response.text,
+                        },
+                    )
+
+                if isinstance(response_dict.get('text'), str):
+                    span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                                       "text")
+                elif response_dict.get('text') is not None:
+                    span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                                       "json")
+
+                span.set_status(Status(StatusCode.OK))
+
+                if disable_metrics is False:
+                    attributes = create_metrics_attributes(
+                        service_name=application_name,
+                        deployment_environment=environment,
+                        operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
+                        system=SemanticConvetion.GEN_AI_SYSTEM_GEMINI,
+                        request_model=request_model,
+                        server_address=server_address,
+                        server_port=server_port,
+                        response_model=response_dict.get('model_version'),
+                    )
+
+                    metrics["genai_client_usage_tokens"].record(
+                        input_tokens + output_tokens, attributes
+                    )
+                    metrics["genai_client_operation_duration"].record(
+                        end_time - start_time, attributes
+                    )
+                    metrics["genai_server_ttft"].record(
+                        end_time - start_time, attributes
+                    )
+                    metrics["genai_requests"].add(1, attributes)
+                    metrics["genai_completion_tokens"].add(output_tokens, attributes)
+                    metrics["genai_prompt_tokens"].add(input_tokens, attributes)
+                    metrics["genai_cost"].record(cost, attributes)
+
+                # Return original response
+                return response
+
+            except Exception as e:
+                handle_exception(span, e)
+                logger.error("Error in trace creation: %s", e)
+
+                # Return original response
+                return response
 
     return wrapper
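The rewritten Google AI Studio wrapper above reads kwargs['model'], kwargs['contents'], and kwargs['config'], and response.text / usage_metadata from the result. A hedged usage sketch of the call path it instruments, assuming the google-genai SDK (the client-side names below come from that SDK, not from this diff):

    import openlit
    from google import genai

    openlit.init()  # installs the generate() wrapper shown above

    client = genai.Client()  # assumes GOOGLE_API_KEY is set in the environment
    response = client.models.generate_content(
        model="gemini-2.0-flash",  # matches the wrapper's default model name
        contents="Write one sentence about telemetry.",
    )
    print(response.text)  # also attached to the span's completion event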
@@ -84,8 +84,8 @@ def generate(gen_ai_endpoint, version, environment, application_name,
             span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
             span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
                                SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL)
-            span.set_attribute(SemanticConvetion.GEN_AI_TYPE,
-                               SemanticConvetion.GEN_AI_TYPE_CHAT)
+            span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
+                               SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
             span.set_attribute(SemanticConvetion.GEN_AI_ENDPOINT,
                                gen_ai_endpoint)
             span.set_attribute(SemanticConvetion.GEN_AI_ENVIRONMENT,
@@ -120,9 +120,9 @@ def generate(gen_ai_endpoint, version, environment, application_name,
                 },
             )
 
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_PROMPT_TOKENS,
+            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
                                prompt_tokens)
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COMPLETION_TOKENS,
+            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
                                completion_tokens)
             span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
                                total_tokens)
@@ -141,8 +141,8 @@ def generate(gen_ai_endpoint, version, environment, application_name,
                     SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL,
                 SemanticConvetion.GEN_AI_ENVIRONMENT:
                     environment,
-                SemanticConvetion.GEN_AI_TYPE:
-                    SemanticConvetion.GEN_AI_TYPE_CHAT,
+                SemanticConvetion.GEN_AI_OPERATION:
+                    SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
                 SemanticConvetion.GEN_AI_REQUEST_MODEL:
                     model
             }
@@ -180,8 +180,8 @@ def generate(gen_ai_endpoint, version, environment, application_name,
             span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
             span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
                                SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL)
-            span.set_attribute(SemanticConvetion.GEN_AI_TYPE,
-                               SemanticConvetion.GEN_AI_TYPE_CHAT)
+            span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
+                               SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
             span.set_attribute(SemanticConvetion.GEN_AI_ENDPOINT,
                                gen_ai_endpoint)
             span.set_attribute(SemanticConvetion.GEN_AI_ENVIRONMENT,
@@ -216,9 +216,9 @@ def generate(gen_ai_endpoint, version, environment, application_name,
                 },
             )
 
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_PROMPT_TOKENS,
+            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
                                prompt_tokens)
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COMPLETION_TOKENS,
+            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
                                completion_tokens)
             span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
                                total_tokens)
@@ -237,8 +237,8 @@ def generate(gen_ai_endpoint, version, environment, application_name,
                     SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL,
                 SemanticConvetion.GEN_AI_ENVIRONMENT:
                     environment,
-                SemanticConvetion.GEN_AI_TYPE:
-                    SemanticConvetion.GEN_AI_TYPE_CHAT,
+                SemanticConvetion.GEN_AI_OPERATION:
+                    SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
                 SemanticConvetion.GEN_AI_REQUEST_MODEL:
                     model
             }
@@ -312,8 +312,8 @@ def embed(gen_ai_endpoint, version, environment, application_name,
             span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
             span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
                                SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL)
-            span.set_attribute(SemanticConvetion.GEN_AI_TYPE,
-                               SemanticConvetion.GEN_AI_TYPE_EMBEDDING)
+            span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
+                               SemanticConvetion.GEN_AI_OPERATION_TYPE_EMBEDDING)
             span.set_attribute(SemanticConvetion.GEN_AI_ENDPOINT,
                                gen_ai_endpoint)
             span.set_attribute(SemanticConvetion.GEN_AI_ENVIRONMENT,
@@ -322,7 +322,7 @@ def embed(gen_ai_endpoint, version, environment, application_name,
                                application_name)
             span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
                                model)
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_PROMPT_TOKENS,
+            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
                                prompt_tokens)
             span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
                                prompt_tokens)
@@ -348,8 +348,8 @@ def embed(gen_ai_endpoint, version, environment, application_name,
                     SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL,
                 SemanticConvetion.GEN_AI_ENVIRONMENT:
                     environment,
-                SemanticConvetion.GEN_AI_TYPE:
-                    SemanticConvetion.GEN_AI_TYPE_EMBEDDING,
+                SemanticConvetion.GEN_AI_OPERATION:
+                    SemanticConvetion.GEN_AI_OPERATION_TYPE_EMBEDDING,
                 SemanticConvetion.GEN_AI_REQUEST_MODEL:
                     model
             }
@@ -104,8 +104,8 @@ def async_chat(gen_ai_endpoint, version, environment, application_name,
             span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
             span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
                                SemanticConvetion.GEN_AI_SYSTEM_GROQ)
-            span.set_attribute(SemanticConvetion.GEN_AI_TYPE,
-                               SemanticConvetion.GEN_AI_TYPE_CHAT)
+            span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
+                               SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
             span.set_attribute(SemanticConvetion.GEN_AI_ENDPOINT,
                                gen_ai_endpoint)
             span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_ID,
@@ -132,9 +132,9 @@ def async_chat(gen_ai_endpoint, version, environment, application_name,
                                kwargs.get("seed", ""))
             span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
                                True)
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_PROMPT_TOKENS,
+            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
                                prompt_tokens)
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COMPLETION_TOKENS,
+            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
                                completion_tokens)
             span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
                                prompt_tokens + completion_tokens)
@@ -166,8 +166,8 @@ def async_chat(gen_ai_endpoint, version, environment, application_name,
                     SemanticConvetion.GEN_AI_SYSTEM_GROQ,
                 SemanticConvetion.GEN_AI_ENVIRONMENT:
                     environment,
-                SemanticConvetion.GEN_AI_TYPE:
-                    SemanticConvetion.GEN_AI_TYPE_CHAT,
+                SemanticConvetion.GEN_AI_OPERATION:
+                    SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
                 SemanticConvetion.GEN_AI_REQUEST_MODEL:
                     kwargs.get("model", "gpt-3.5-turbo")
             }
@@ -216,8 +216,8 @@ def async_chat(gen_ai_endpoint, version, environment, application_name,
             span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
             span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
                                SemanticConvetion.GEN_AI_SYSTEM_GROQ)
-            span.set_attribute(SemanticConvetion.GEN_AI_TYPE,
-                               SemanticConvetion.GEN_AI_TYPE_CHAT)
+            span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
+                               SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
             span.set_attribute(SemanticConvetion.GEN_AI_ENDPOINT,
                                gen_ai_endpoint)
             span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_ID,
@@ -259,9 +259,9 @@ def async_chat(gen_ai_endpoint, version, environment, application_name,
                 pricing_info, response.usage.prompt_tokens,
                 response.usage.completion_tokens)
 
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_PROMPT_TOKENS,
+            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
                                response.usage.prompt_tokens)
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COMPLETION_TOKENS,
+            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
                                response.usage.completion_tokens)
             span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
                                response.usage.total_tokens)
@@ -305,9 +305,9 @@ def async_chat(gen_ai_endpoint, version, environment, application_name,
 
             span.set_attribute(SemanticConvetion.GEN_AI_CONTENT_COMPLETION,
                                "Function called with tools")
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_PROMPT_TOKENS,
+            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
                                response.usage.prompt_tokens)
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COMPLETION_TOKENS,
+            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
                                response.usage.completion_tokens)
             span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
                                response.usage.total_tokens)
@@ -326,8 +326,8 @@ def async_chat(gen_ai_endpoint, version, environment, application_name,
                     SemanticConvetion.GEN_AI_SYSTEM_GROQ,
                 SemanticConvetion.GEN_AI_ENVIRONMENT:
                     environment,
-                SemanticConvetion.GEN_AI_TYPE:
-                    SemanticConvetion.GEN_AI_TYPE_CHAT,
+                SemanticConvetion.GEN_AI_OPERATION:
+                    SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
                 SemanticConvetion.GEN_AI_REQUEST_MODEL:
                     kwargs.get("model", "gpt-3.5-turbo")
             }
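
The helpers imported at the top of the Google AI Studio module (response_as_dict, create_metrics_attributes, set_server_address_and_port) live in openlit/__helpers.py, whose +83 added lines are not reproduced in this view. Inferred only from its call site in the hunks above, create_metrics_attributes plausibly builds the attribute dict shared by every genai_* metric point; a hypothetical sketch, not the actual implementation:

    def create_metrics_attributes(service_name, deployment_environment, operation,
                                  system, request_model, server_address, server_port,
                                  response_model):
        # Hypothetical shape: keys mirror the span attributes set in the hunks above.
        return {
            TELEMETRY_SDK_NAME: "openlit",
            SERVICE_NAME: service_name,
            DEPLOYMENT_ENVIRONMENT: deployment_environment,
            SemanticConvetion.GEN_AI_OPERATION: operation,
            SemanticConvetion.GEN_AI_SYSTEM: system,
            SemanticConvetion.GEN_AI_REQUEST_MODEL: request_model,
            SemanticConvetion.SERVER_ADDRESS: server_address,
            SemanticConvetion.SERVER_PORT: server_port,
            SemanticConvetion.GEN_AI_RESPONSE_MODEL: response_model,
        }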