openlit 1.33.9__py3-none-any.whl → 1.33.11__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- openlit/__helpers.py +78 -0
- openlit/__init__.py +41 -13
- openlit/instrumentation/ag2/__init__.py +9 -10
- openlit/instrumentation/ag2/ag2.py +134 -69
- openlit/instrumentation/ai21/__init__.py +6 -5
- openlit/instrumentation/ai21/ai21.py +71 -534
- openlit/instrumentation/ai21/async_ai21.py +71 -534
- openlit/instrumentation/ai21/utils.py +407 -0
- openlit/instrumentation/anthropic/__init__.py +3 -3
- openlit/instrumentation/anthropic/anthropic.py +5 -5
- openlit/instrumentation/anthropic/async_anthropic.py +5 -5
- openlit/instrumentation/assemblyai/__init__.py +2 -2
- openlit/instrumentation/assemblyai/assemblyai.py +3 -3
- openlit/instrumentation/astra/__init__.py +25 -25
- openlit/instrumentation/astra/astra.py +7 -7
- openlit/instrumentation/astra/async_astra.py +7 -7
- openlit/instrumentation/azure_ai_inference/__init__.py +5 -5
- openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +11 -11
- openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +11 -11
- openlit/instrumentation/bedrock/__init__.py +2 -2
- openlit/instrumentation/bedrock/bedrock.py +3 -3
- openlit/instrumentation/chroma/__init__.py +9 -9
- openlit/instrumentation/chroma/chroma.py +7 -7
- openlit/instrumentation/cohere/__init__.py +7 -7
- openlit/instrumentation/cohere/async_cohere.py +10 -10
- openlit/instrumentation/cohere/cohere.py +11 -11
- openlit/instrumentation/controlflow/__init__.py +4 -4
- openlit/instrumentation/controlflow/controlflow.py +5 -5
- openlit/instrumentation/crawl4ai/__init__.py +3 -3
- openlit/instrumentation/crawl4ai/async_crawl4ai.py +5 -5
- openlit/instrumentation/crawl4ai/crawl4ai.py +5 -5
- openlit/instrumentation/crewai/__init__.py +3 -3
- openlit/instrumentation/crewai/crewai.py +6 -4
- openlit/instrumentation/dynamiq/__init__.py +5 -5
- openlit/instrumentation/dynamiq/dynamiq.py +5 -5
- openlit/instrumentation/elevenlabs/__init__.py +5 -5
- openlit/instrumentation/elevenlabs/async_elevenlabs.py +4 -5
- openlit/instrumentation/elevenlabs/elevenlabs.py +4 -5
- openlit/instrumentation/embedchain/__init__.py +2 -2
- openlit/instrumentation/embedchain/embedchain.py +9 -9
- openlit/instrumentation/firecrawl/__init__.py +3 -3
- openlit/instrumentation/firecrawl/firecrawl.py +5 -5
- openlit/instrumentation/google_ai_studio/__init__.py +3 -3
- openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +3 -3
- openlit/instrumentation/google_ai_studio/google_ai_studio.py +3 -3
- openlit/instrumentation/gpt4all/__init__.py +5 -5
- openlit/instrumentation/gpt4all/gpt4all.py +350 -225
- openlit/instrumentation/gpu/__init__.py +5 -5
- openlit/instrumentation/groq/__init__.py +5 -5
- openlit/instrumentation/groq/async_groq.py +359 -243
- openlit/instrumentation/groq/groq.py +359 -243
- openlit/instrumentation/haystack/__init__.py +2 -2
- openlit/instrumentation/haystack/haystack.py +5 -5
- openlit/instrumentation/julep/__init__.py +7 -7
- openlit/instrumentation/julep/async_julep.py +6 -6
- openlit/instrumentation/julep/julep.py +6 -6
- openlit/instrumentation/langchain/__init__.py +15 -9
- openlit/instrumentation/langchain/async_langchain.py +388 -0
- openlit/instrumentation/langchain/langchain.py +110 -497
- openlit/instrumentation/letta/__init__.py +7 -7
- openlit/instrumentation/letta/letta.py +10 -8
- openlit/instrumentation/litellm/__init__.py +9 -10
- openlit/instrumentation/litellm/async_litellm.py +321 -250
- openlit/instrumentation/litellm/litellm.py +319 -248
- openlit/instrumentation/llamaindex/__init__.py +2 -2
- openlit/instrumentation/llamaindex/llamaindex.py +5 -5
- openlit/instrumentation/mem0/__init__.py +2 -2
- openlit/instrumentation/mem0/mem0.py +5 -5
- openlit/instrumentation/milvus/__init__.py +2 -2
- openlit/instrumentation/milvus/milvus.py +7 -7
- openlit/instrumentation/mistral/__init__.py +13 -13
- openlit/instrumentation/mistral/async_mistral.py +426 -253
- openlit/instrumentation/mistral/mistral.py +424 -250
- openlit/instrumentation/multion/__init__.py +7 -7
- openlit/instrumentation/multion/async_multion.py +9 -7
- openlit/instrumentation/multion/multion.py +9 -7
- openlit/instrumentation/ollama/__init__.py +19 -39
- openlit/instrumentation/ollama/async_ollama.py +137 -563
- openlit/instrumentation/ollama/ollama.py +136 -563
- openlit/instrumentation/ollama/utils.py +333 -0
- openlit/instrumentation/openai/__init__.py +11 -11
- openlit/instrumentation/openai/async_openai.py +25 -27
- openlit/instrumentation/openai/openai.py +25 -27
- openlit/instrumentation/phidata/__init__.py +2 -2
- openlit/instrumentation/phidata/phidata.py +6 -4
- openlit/instrumentation/pinecone/__init__.py +6 -6
- openlit/instrumentation/pinecone/pinecone.py +7 -7
- openlit/instrumentation/premai/__init__.py +5 -5
- openlit/instrumentation/premai/premai.py +268 -219
- openlit/instrumentation/qdrant/__init__.py +2 -2
- openlit/instrumentation/qdrant/async_qdrant.py +7 -7
- openlit/instrumentation/qdrant/qdrant.py +7 -7
- openlit/instrumentation/reka/__init__.py +5 -5
- openlit/instrumentation/reka/async_reka.py +93 -55
- openlit/instrumentation/reka/reka.py +93 -55
- openlit/instrumentation/together/__init__.py +9 -9
- openlit/instrumentation/together/async_together.py +284 -242
- openlit/instrumentation/together/together.py +284 -242
- openlit/instrumentation/transformers/__init__.py +3 -3
- openlit/instrumentation/transformers/transformers.py +79 -48
- openlit/instrumentation/vertexai/__init__.py +19 -69
- openlit/instrumentation/vertexai/async_vertexai.py +333 -990
- openlit/instrumentation/vertexai/vertexai.py +333 -990
- openlit/instrumentation/vllm/__init__.py +3 -3
- openlit/instrumentation/vllm/vllm.py +65 -35
- openlit/otel/events.py +85 -0
- openlit/otel/tracing.py +3 -13
- openlit/semcov/__init__.py +16 -4
- {openlit-1.33.9.dist-info → openlit-1.33.11.dist-info}/METADATA +2 -2
- openlit-1.33.11.dist-info/RECORD +125 -0
- openlit-1.33.9.dist-info/RECORD +0 -121
- {openlit-1.33.9.dist-info → openlit-1.33.11.dist-info}/LICENSE +0 -0
- {openlit-1.33.9.dist-info → openlit-1.33.11.dist-info}/WHEEL +0 -0
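
The recurring change across these instrumentors is a `capture_message_content` flag threaded from the shared init kwargs into every wrapper factory, alongside a new OTel events pipeline (`openlit/otel/events.py`). Below is a minimal sketch of opting out of content capture, assuming the flag is exposed on `openlit.init` (the hunks that follow only show each instrumentor reading it via `kwargs.get("capture_message_content")`):

```python
# Hedged sketch: disable prompt/completion capture in openlit 1.33.11.
# Assumption: openlit.init() accepts capture_message_content and forwards it
# in the kwargs dict that each instrumentor's _instrument() reads below.
import openlit

openlit.init(
    application_name="demo-app",       # recorded as the OTel service name
    environment="development",         # recorded as the deployment environment
    capture_message_content=False,     # omit message bodies from spans/events
)
```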
openlit/instrumentation/ollama/utils.py (new file)

```diff
@@ -0,0 +1,333 @@
+"""
+Ollama OpenTelemetry instrumentation utility functions
+"""
+import time
+
+from opentelemetry.sdk.resources import SERVICE_NAME, TELEMETRY_SDK_NAME, DEPLOYMENT_ENVIRONMENT
+from opentelemetry.trace import Status, StatusCode
+
+from openlit.__helpers import (
+    calculate_ttft,
+    response_as_dict,
+    calculate_tbt,
+    general_tokens,
+    extract_and_format_input,
+    get_chat_model_cost,
+    get_embed_model_cost,
+    handle_exception,
+    create_metrics_attributes,
+    otel_event,
+    concatenate_all_contents
+)
+from openlit.semcov import SemanticConvetion
+
+def process_chunk(self, chunk):
+    """
+    Process a chunk of response data and update state.
+    """
+
+    end_time = time.time()
+    # Record the timestamp for the current chunk
+    self._timestamps.append(end_time)
+
+    if len(self._timestamps) == 1:
+        # Calculate time to first chunk
+        self._ttft = calculate_ttft(self._timestamps, self._start_time)
+
+    chunked = response_as_dict(chunk)
+    self._llmresponse += chunked.get('message', {}).get('content', '')
+
+    if chunked.get('message', {}).get('tool_calls'):
+        self._tool_calls = chunked['message']['tool_calls']
+
+    if chunked.get('eval_count'):
+        self._response_role = chunked.get('message', {}).get('role', '')
+        self._input_tokens = chunked.get('prompt_eval_count', 0)
+        self._output_tokens = chunked.get('eval_count', 0)
+        self._response_model = chunked.get('model', '')
+        self._finish_reason = chunked.get('done_reason', '')
+
+def common_chat_logic(scope, pricing_info, environment, application_name, metrics,
+                      event_provider, capture_message_content, disable_metrics, version, is_stream):
+    """
+    Process chat request and generate Telemetry
+    """
+
+    scope._end_time = time.time()
+    if len(scope._timestamps) > 1:
+        scope._tbt = calculate_tbt(scope._timestamps)
+
+    formatted_messages = extract_and_format_input(scope._kwargs.get("messages", ""))
+    request_model = scope._kwargs.get("model", "gpt-4o")
+
+    cost = get_chat_model_cost(request_model, pricing_info, scope._input_tokens, scope._output_tokens)
+
+    # Set Span attributes (OTel Semconv)
+    scope._span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_OPERATION, SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM, SemanticConvetion.GEN_AI_SYSTEM_OLLAMA)
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL, request_model)
+    scope._span.set_attribute(SemanticConvetion.SERVER_PORT, scope._server_port)
+
+    options = scope._kwargs.get('options', {})
+    attributes = [
+        (SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'repeat_penalty'),
+        (SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS, 'max_tokens'),
+        (SemanticConvetion.GEN_AI_REQUEST_SEED, 'seed'),
+        (SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop'),
+        (SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
+        (SemanticConvetion.GEN_AI_REQUEST_TOP_P, 'top_p'),
+        (SemanticConvetion.GEN_AI_REQUEST_TOP_K, 'top_k'),
+    ]
+
+    for attribute, key in attributes:
+        value = options.get(key)
+        if value is not None:
+            scope._span.set_attribute(attribute, value)
+
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_FINISH_REASON, [scope._finish_reason])
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL, scope._response_model)
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens)
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens)
+    scope._span.set_attribute(SemanticConvetion.SERVER_ADDRESS, scope._server_address)
+
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                              "text" if isinstance(scope._llmresponse, str) else "json")
+
+    scope._span.set_attribute(DEPLOYMENT_ENVIRONMENT, environment)
+    scope._span.set_attribute(SERVICE_NAME, application_name)
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM, is_stream)
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_CLIENT_TOKEN_USAGE, scope._input_tokens + scope._output_tokens)
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST, cost)
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TBT, scope._tbt)
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT, scope._ttft)
+    scope._span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION, version)
+
+    # To be removed one the change to log events (from span events) is complete
+    prompt = concatenate_all_contents(formatted_messages)
+    if capture_message_content:
+        scope._span.add_event(
+            name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+            attributes={
+                SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+            },
+        )
+        scope._span.add_event(
+            name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+            attributes={
+                SemanticConvetion.GEN_AI_CONTENT_COMPLETION: scope._llmresponse,
+            },
+        )
+
+    choice_event_body = {
+        "finish_reason": scope._finish_reason,
+        "index": 0,
+        "message": {
+            **({"content": scope._llmresponse} if capture_message_content else {}),
+            "role": scope._response_role
+        }
+    }
+
+    if scope._tool_calls:
+        print(scope._tool_calls)
+        function_call = scope._tool_calls[0]
+        choice_event_body["message"].update({
+            "tool_calls": {
+                "function": {
+                    "name": function_call.get('function', {}).get('name', ''),
+                    "arguments": function_call.get('function', {}).get('arguments', '')
+                },
+                "id": function_call.get('id', ''),
+                "type": "function"
+            }
+        })
+
+    # Emit events
+    for role in ['user', 'system', 'assistant', 'tool']:
+        if formatted_messages.get(role, {}).get('content', ''):
+            event = otel_event(
+                name=getattr(SemanticConvetion, f'GEN_AI_{role.upper()}_MESSAGE'),
+                attributes={
+                    SemanticConvetion.GEN_AI_SYSTEM: SemanticConvetion.GEN_AI_SYSTEM_OLLAMA
+                },
+                body = {
+                    # pylint: disable=line-too-long
+                    **({"content": formatted_messages.get(role, {}).get('content', '')} if capture_message_content else {}),
+                    "role": formatted_messages.get(role, {}).get('role', []),
+                    **({
+                        "tool_calls": {
+                            "function": {
+                                # pylint: disable=line-too-long
+                                "name": (scope._tool_calls[0].get('function', {}).get('name', '') if scope._tool_calls else ''),
+                                "arguments": (scope._tool_calls[0].get('function', {}).get('arguments', '') if scope._tool_calls else '')
+                            },
+                            "id": (scope._tool_calls[0].get('id', '') if scope._tool_calls else ''),
+                            "type": "function"
+                        }
+                    } if role == 'assistant' else {}),
+                    **({
+                        "id": (scope._tool_calls[0].get('id', '') if scope._tool_calls else '')
+                    } if role == 'tool' else {})
+                }
+            )
+            event_provider.emit(event)
+
+    choice_event = otel_event(
+        name=SemanticConvetion.GEN_AI_CHOICE,
+        attributes={
+            SemanticConvetion.GEN_AI_SYSTEM: SemanticConvetion.GEN_AI_SYSTEM_OLLAMA
+        },
+        body=choice_event_body
+    )
+    event_provider.emit(choice_event)
+
+    scope._span.set_status(Status(StatusCode.OK))
+
+    if not disable_metrics:
+        metrics_attributes = create_metrics_attributes(
+            service_name=application_name,
+            deployment_environment=environment,
+            operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
+            system=SemanticConvetion.GEN_AI_SYSTEM_OLLAMA,
+            request_model=request_model,
+            server_address=scope._server_address,
+            server_port=scope._server_port,
+            response_model=scope._response_model,
+        )
+
+        metrics["genai_client_usage_tokens"].record(scope._input_tokens + scope._output_tokens, metrics_attributes)
+        metrics["genai_client_operation_duration"].record(scope._end_time - scope._start_time, metrics_attributes)
+        metrics["genai_server_tbt"].record(scope._tbt, metrics_attributes)
+        metrics["genai_server_ttft"].record(scope._ttft, metrics_attributes)
+        metrics["genai_requests"].add(1, metrics_attributes)
+        metrics["genai_completion_tokens"].add(scope._output_tokens, metrics_attributes)
+        metrics["genai_prompt_tokens"].add(scope._input_tokens, metrics_attributes)
+        metrics["genai_cost"].record(cost, metrics_attributes)
+
+def process_streaming_chat_response(self, pricing_info, environment, application_name, metrics,
+                                    event_provider, capture_message_content=False, disable_metrics=False, version=''):
+    """
+    Process chat request and generate Telemetry
+    """
+
+    common_chat_logic(self, pricing_info, environment, application_name, metrics,
+                      event_provider, capture_message_content, disable_metrics, version, is_stream=True)
+
+def process_chat_response(response, request_model, pricing_info, server_port, server_address,
+                          environment, application_name, metrics, event_provider, start_time,
+                          span, capture_message_content=False, disable_metrics=False, version="1.0.0", **kwargs):
+    """
+    Process chat request and generate Telemetry
+    """
+
+    self = type('GenericScope', (), {})()
+
+    # pylint: disable = no-member
+    self._start_time = start_time
+    self._end_time = time.time()
+    self._span = span
+    self._llmresponse = response.get('message', {}).get('content', '')
+    self._response_role = response.get('message', {}).get('role', 'assistant')
+    self._input_tokens = response.get('prompt_eval_count')
+    self._output_tokens = response.get('eval_count')
+    self._response_model = response.get('model', '')
+    self._finish_reason = response.get('done_reason', '')
+    self._timestamps = []
+    self._ttft, self._tbt = self._end_time - self._start_time, 0
+    self._server_address, self._server_port = server_address, server_port
+    self._kwargs = kwargs
+    self._tool_calls = response.get('message', {}).get('tool_calls', [])
+
+    common_chat_logic(self, pricing_info, environment, application_name, metrics,
+                      event_provider, capture_message_content, disable_metrics, version, is_stream=False)
+
+    return response
+
+def process_embedding_response(response, request_model, pricing_info, server_port, server_address,
+                               environment, application_name, metrics, event_provider,
+                               start_time, span, capture_message_content=False, disable_metrics=False, version="1.0.0", **kwargs):
+    """
+    Process embedding request and generate Telemetry
+    """
+
+    end_time = time.time()
+
+    try:
+        input_tokens = general_tokens(str(kwargs.get('prompt')))
+
+        # Calculate cost of the operation
+        cost = get_embed_model_cost(request_model,
+                                    pricing_info, input_tokens)
+
+        # Set Span attributes (OTel Semconv)
+        span.set_attribute(TELEMETRY_SDK_NAME, 'openlit')
+        span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
+                           SemanticConvetion.GEN_AI_OPERATION_TYPE_EMBEDDING)
+        span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
+                           SemanticConvetion.GEN_AI_SYSTEM_OLLAMA)
+        span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+                           request_model)
+        span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                           request_model)
+        span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                           server_address)
+        span.set_attribute(SemanticConvetion.SERVER_PORT,
+                           server_port)
+        span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                           input_tokens)
+
+        # Set Span attributes (Extras)
+        span.set_attribute(DEPLOYMENT_ENVIRONMENT,
+                           environment)
+        span.set_attribute(SERVICE_NAME,
+                           application_name)
+        span.set_attribute(SemanticConvetion.GEN_AI_CLIENT_TOKEN_USAGE,
+                           input_tokens)
+        span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                           cost)
+        span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                           version)
+
+        prompt_event = otel_event(
+            name=SemanticConvetion.GEN_AI_USER_MESSAGE,
+            attributes={
+                SemanticConvetion.GEN_AI_SYSTEM: SemanticConvetion.GEN_AI_SYSTEM_OLLAMA
+            },
+            body={
+                **({"content": kwargs.get('prompt', '')} if capture_message_content else {}),
+                "role": 'user'
+            }
+        )
+        event_provider.emit(prompt_event)
+
+        span.set_status(Status(StatusCode.OK))
+
+        if disable_metrics is False:
+            attributes = create_metrics_attributes(
+                service_name=application_name,
+                deployment_environment=environment,
+                operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_EMBEDDING,
+                system=SemanticConvetion.GEN_AI_SYSTEM_OLLAMA,
+                request_model=request_model,
+                server_address=server_address,
+                server_port=server_port,
+                response_model=request_model,
+            )
+            metrics['genai_client_usage_tokens'].record(
+                input_tokens, attributes
+            )
+            metrics['genai_client_operation_duration'].record(
+                end_time - start_time, attributes
+            )
+            metrics['genai_requests'].add(1, attributes)
+            metrics['genai_prompt_tokens'].add(input_tokens, attributes)
+            metrics['genai_cost'].record(cost, attributes)
+
+        # Return original response
+        return response
+
+    except Exception as e:
+        handle_exception(span, e)
+
+        # Return original response
+        return response
```
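
Both the one-shot and streaming paths above converge on `common_chat_logic`, which expects its per-request state on a single scope object; `process_chat_response` builds that scope with a throwaway `type('GenericScope', (), {})()` instance rather than a dataclass. A rough sketch of the shape that object carries (values here are illustrative defaults, not openlit API):

```python
import time

# Sketch of the ad-hoc state object consumed by common_chat_logic();
# a live stream wrapper (self) exposes these same fields as it iterates.
scope = type('GenericScope', (), {})()
scope._start_time = time.time()
scope._timestamps = []      # chunk arrival times; more than one enables TBT
scope._llmresponse = ''     # aggregated completion text
scope._tool_calls = []      # raw tool_calls from the Ollama message
scope._input_tokens = 0     # prompt_eval_count from the response
scope._output_tokens = 0    # eval_count from the response
# ...plus _span, _kwargs, _response_model, _finish_reason,
# _server_address and _server_port, as set in process_chat_response above.
```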
openlit/instrumentation/openai/__init__.py

```diff
@@ -25,7 +25,7 @@ class OpenAIInstrumentor(BaseInstrumentor):
         tracer = kwargs.get("tracer")
         metrics = kwargs.get("metrics_dict")
         pricing_info = kwargs.get("pricing_info")
-
+        capture_message_content = kwargs.get("capture_message_content")
         disable_metrics = kwargs.get("disable_metrics")
         version = importlib.metadata.version("openai")
 
@@ -33,7 +33,7 @@ class OpenAIInstrumentor(BaseInstrumentor):
             "openai.resources.chat.completions",
             "Completions.create",
             chat_completions(version, environment, application_name,
-                             tracer, pricing_info,
+                             tracer, pricing_info, capture_message_content,
                              metrics, disable_metrics),
         )
 
@@ -41,7 +41,7 @@ class OpenAIInstrumentor(BaseInstrumentor):
             "openai.resources.chat.completions",
             "AsyncCompletions.create",
             async_chat_completions(version, environment, application_name,
-                                   tracer, pricing_info,
+                                   tracer, pricing_info, capture_message_content,
                                    metrics, disable_metrics),
         )
 
@@ -49,7 +49,7 @@ class OpenAIInstrumentor(BaseInstrumentor):
             "openai.resources.images",
             "Images.generate",
             image_generate(version, environment, application_name,
-                           tracer, pricing_info,
+                           tracer, pricing_info, capture_message_content,
                            metrics, disable_metrics),
         )
 
@@ -57,7 +57,7 @@ class OpenAIInstrumentor(BaseInstrumentor):
             "openai.resources.images",
             "AsyncImages.generate",
             async_image_generate(version, environment, application_name,
-                                 tracer, pricing_info,
+                                 tracer, pricing_info, capture_message_content,
                                  metrics, disable_metrics),
         )
 
@@ -65,7 +65,7 @@ class OpenAIInstrumentor(BaseInstrumentor):
             "openai.resources.embeddings",
             "Embeddings.create",
             embedding(version, environment, application_name,
-                      tracer, pricing_info,
+                      tracer, pricing_info, capture_message_content,
                       metrics, disable_metrics),
         )
 
@@ -73,7 +73,7 @@ class OpenAIInstrumentor(BaseInstrumentor):
             "openai.resources.embeddings",
             "AsyncEmbeddings.create",
             async_embedding(version, environment, application_name,
-                            tracer, pricing_info,
+                            tracer, pricing_info, capture_message_content,
                             metrics, disable_metrics),
         )
 
@@ -82,7 +82,7 @@ class OpenAIInstrumentor(BaseInstrumentor):
             "Images.create_variation",
             image_variatons(version,
                             environment, application_name,
-                            tracer, pricing_info,
+                            tracer, pricing_info, capture_message_content,
                             metrics, disable_metrics),
         )
 
@@ -91,7 +91,7 @@ class OpenAIInstrumentor(BaseInstrumentor):
             "AsyncImages.create_variation",
             async_image_variatons(version,
                                   environment, application_name,
-                                  tracer, pricing_info,
+                                  tracer, pricing_info, capture_message_content,
                                   metrics, disable_metrics),
         )
 
@@ -99,7 +99,7 @@ class OpenAIInstrumentor(BaseInstrumentor):
             "openai.resources.audio.speech",
             "Speech.create",
             audio_create(version, environment, application_name,
-                         tracer, pricing_info,
+                         tracer, pricing_info, capture_message_content,
                          metrics, disable_metrics),
         )
 
@@ -107,7 +107,7 @@ class OpenAIInstrumentor(BaseInstrumentor):
             "openai.resources.audio.speech",
             "AsyncSpeech.create",
             async_audio_create(version, environment, application_name,
-                               tracer, pricing_info,
+                               tracer, pricing_info, capture_message_content,
                                metrics, disable_metrics),
         )
 
```
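
Each wrapper factory now takes the flag positionally between `pricing_info` and `metrics`. A hedged sketch of driving the instrumentor directly with the kwargs `_instrument` reads above; `openlit.init` normally assembles these, and the values here are placeholders:

```python
from opentelemetry import trace
from openlit.instrumentation.openai import OpenAIInstrumentor

# Sketch only: BaseInstrumentor.instrument() forwards these kwargs to
# _instrument(), which reads them via kwargs.get(...) in the hunk above.
OpenAIInstrumentor().instrument(
    environment="development",
    application_name="demo-app",
    tracer=trace.get_tracer(__name__),
    pricing_info={},                  # cost lookup table; empty yields zero cost
    capture_message_content=True,     # forwarded into every wrapper factory
    metrics_dict={},                  # unused when metrics are disabled
    disable_metrics=True,
)
```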
openlit/instrumentation/openai/async_openai.py

```diff
@@ -25,7 +25,7 @@ from openlit.semcov import SemanticConvetion
 logger = logging.getLogger(__name__)
 
 def async_chat_completions(version, environment, application_name,
-                           tracer, pricing_info,
+                           tracer, pricing_info, capture_message_content, metrics, disable_metrics):
     """
     Generates a telemetry wrapper for chat completions to collect metrics.
 
@@ -35,7 +35,7 @@ def async_chat_completions(version, environment, application_name,
         application_name: Name of the application using the OpenAI API.
         tracer: OpenTelemetry tracer for creating spans.
         pricing_info: Information used for calculating the cost of OpenAI usage.
-
+        capture_message_content: Flag indicating whether to trace the actual content.
 
     Returns:
         A function that wraps the chat completions method to add telemetry.
@@ -44,7 +44,7 @@ def async_chat_completions(version, environment, application_name,
     class TracedAsyncStream:
         """
         Wrapper for streaming responses to collect metrics and trace data.
-        Wraps the
+        Wraps the response to collect message IDs and aggregated response.
 
         This class implements the '__aiter__' and '__anext__' methods that
         handle asynchronous streaming responses.
@@ -197,11 +197,11 @@ def async_chat_completions(version, environment, application_name,
                                          output_tokens)
                self._span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
                                         self._server_address)
-               self._span.set_attribute(SemanticConvetion.
+               self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_SERVICE_TIER,
                                         self._kwargs.get("service_tier", "auto"))
-               self._span.set_attribute(SemanticConvetion.
+               self._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_SERVICE_TIER,
                                         self._openai_response_service_tier)
-               self._span.set_attribute(SemanticConvetion.
+               self._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_SYSTEM_FINGERPRINT,
                                         self._openai_system_fingerprint)
                if isinstance(self._llmresponse, str):
                    self._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
@@ -229,7 +229,7 @@ def async_chat_completions(version, environment, application_name,
                                         self._ttft)
                self._span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
                                         version)
-               if
+               if capture_message_content:
                    self._span.add_event(
                        name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
                        attributes={
@@ -382,12 +382,12 @@ def async_chat_completions(version, environment, application_name,
                                       output_tokens)
                    span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
                                       server_address)
-                   span.set_attribute(SemanticConvetion.
+                   span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_SERVICE_TIER,
                                       kwargs.get("service_tier", "auto"))
-                   span.set_attribute(SemanticConvetion.
+                   span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_SERVICE_TIER,
                                       response_dict.get('service_tier'))
-                   span.set_attribute(SemanticConvetion.
-                                      response_dict.get('system_fingerprint'))
+                   span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_SYSTEM_FINGERPRINT,
+                                      response_dict.get('system_fingerprint', ''))
 
                    # Set base span attribues (Extras)
                    span.set_attribute(DEPLOYMENT_ENVIRONMENT,
@@ -406,7 +406,7 @@ def async_chat_completions(version, environment, application_name,
                                       end_time - start_time)
                    span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
                                       version)
-                   if
+                   if capture_message_content:
                        span.add_event(
                            name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
                            attributes={
@@ -417,7 +417,7 @@ def async_chat_completions(version, environment, application_name,
                    for i in range(kwargs.get('n',1)):
                        span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_FINISH_REASON,
                                           [response_dict.get('choices')[i].get('finish_reason')])
-                       if
+                       if capture_message_content:
                            span.add_event(
                                name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
                                attributes={
@@ -477,7 +477,7 @@ def async_chat_completions(version, environment, application_name,
     return wrapper
 
 def async_embedding(version, environment, application_name,
-                    tracer, pricing_info,
+                    tracer, pricing_info, capture_message_content, metrics, disable_metrics):
     """
     Generates a telemetry wrapper for embeddings to collect metrics.
 
@@ -487,7 +487,7 @@ def async_embedding(version, environment, application_name,
         application_name: Name of the application using the OpenAI API.
         tracer: OpenTelemetry tracer for creating spans.
         pricing_info: Information used for calculating the cost of OpenAI usage.
-
+        capture_message_content: Flag indicating whether to trace the actual content.
 
     Returns:
         A function that wraps the embeddings method to add telemetry.
@@ -561,7 +561,7 @@ def async_embedding(version, environment, application_name,
                span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
                                   version)
 
-               if
+               if capture_message_content:
                    span.add_event(
                        name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
                        attributes={
@@ -605,7 +605,7 @@ def async_embedding(version, environment, application_name,
     return wrapper
 
 def async_image_generate(version, environment, application_name,
-                         tracer, pricing_info,
+                         tracer, pricing_info, capture_message_content, metrics, disable_metrics):
     """
     Generates a telemetry wrapper for image generation to collect metrics.
 
@@ -615,7 +615,7 @@ def async_image_generate(version, environment, application_name,
         application_name: Name of the application using the OpenAI API.
         tracer: OpenTelemetry tracer for creating spans.
         pricing_info: Information used for calculating the cost of OpenAI image generation.
-
+        capture_message_content: Flag indicating whether to trace the input prompt and generated images.
 
     Returns:
         A function that wraps the image generation method to add telemetry.
@@ -657,8 +657,6 @@ def async_image_generate(version, environment, application_name,
                else:
                    image = "url"
 
-               request_model = kwargs.get("model", "dall-e-2")
-
                # Calculate cost of the operation
                cost = get_image_model_cost(request_model,
                                            pricing_info, kwargs.get("size", "1024x1024"),
@@ -702,7 +700,7 @@ def async_image_generate(version, environment, application_name,
                span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
                                   version)
 
-               if
+               if capture_message_content:
                    span.add_event(
                        name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
                        attributes={
@@ -754,7 +752,7 @@ def async_image_generate(version, environment, application_name,
     return wrapper
 
 def async_image_variatons(version, environment, application_name,
-                          tracer, pricing_info,
+                          tracer, pricing_info, capture_message_content, metrics, disable_metrics):
     """
     Generates a telemetry wrapper for creating image variations to collect metrics.
 
@@ -764,7 +762,7 @@ def async_image_variatons(version, environment, application_name,
         application_name: Name of the application using the OpenAI API.
         tracer: OpenTelemetry tracer for creating spans.
         pricing_info: Information used for calculating the cost of generating image variations.
-
+        capture_message_content: Flag indicating whether to trace the input image and generated variations.
 
     Returns:
         A function that wraps the image variations creation method to add telemetry.
@@ -844,7 +842,7 @@ def async_image_variatons(version, environment, application_name,
                span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
                                   version)
 
-               if
+               if capture_message_content:
                    attribute_name = f"{SemanticConvetion.GEN_AI_RESPONSE_IMAGE}.{images_count}"
                    span.add_event(
                        name=attribute_name,
@@ -890,7 +888,7 @@ def async_image_variatons(version, environment, application_name,
     return wrapper
 
 def async_audio_create(version, environment, application_name,
-                       tracer, pricing_info,
+                       tracer, pricing_info, capture_message_content, metrics, disable_metrics):
     """
     Generates a telemetry wrapper for creating speech audio to collect metrics.
 
@@ -900,7 +898,7 @@ def async_audio_create(version, environment, application_name,
         application_name: Name of the application using the OpenAI API.
         tracer: OpenTelemetry tracer for creating spans.
         pricing_info: Information used for calculating the cost of generating speech audio.
-
+        capture_message_content: Flag indicating whether to trace the input text and generated audio.
 
     Returns:
         A function that wraps the speech audio creation method to add telemetry.
@@ -969,7 +967,7 @@ def async_audio_create(version, environment, application_name,
                                   cost)
                span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
                                   version)
-               if
+               if capture_message_content:
                    span.add_event(
                        name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
                        attributes={
```