openlit 1.34.30__py3-none-any.whl → 1.34.31__py3-none-any.whl
This diff shows the publicly released contents of the two package versions as they appear in their respective supported registries. It is provided for informational purposes only.
- openlit/__helpers.py +235 -86
- openlit/__init__.py +16 -13
- openlit/_instrumentors.py +2 -1
- openlit/evals/all.py +50 -21
- openlit/evals/bias_detection.py +47 -20
- openlit/evals/hallucination.py +53 -22
- openlit/evals/toxicity.py +50 -21
- openlit/evals/utils.py +54 -30
- openlit/guard/all.py +61 -19
- openlit/guard/prompt_injection.py +34 -14
- openlit/guard/restrict_topic.py +46 -15
- openlit/guard/sensitive_topic.py +34 -14
- openlit/guard/utils.py +58 -22
- openlit/instrumentation/ag2/__init__.py +24 -8
- openlit/instrumentation/ag2/ag2.py +34 -13
- openlit/instrumentation/ag2/async_ag2.py +34 -13
- openlit/instrumentation/ag2/utils.py +133 -30
- openlit/instrumentation/ai21/__init__.py +43 -14
- openlit/instrumentation/ai21/ai21.py +47 -21
- openlit/instrumentation/ai21/async_ai21.py +47 -21
- openlit/instrumentation/ai21/utils.py +299 -78
- openlit/instrumentation/anthropic/__init__.py +21 -4
- openlit/instrumentation/anthropic/anthropic.py +28 -17
- openlit/instrumentation/anthropic/async_anthropic.py +28 -17
- openlit/instrumentation/anthropic/utils.py +145 -35
- openlit/instrumentation/assemblyai/__init__.py +11 -2
- openlit/instrumentation/assemblyai/assemblyai.py +15 -4
- openlit/instrumentation/assemblyai/utils.py +120 -25
- openlit/instrumentation/astra/__init__.py +43 -10
- openlit/instrumentation/astra/astra.py +28 -5
- openlit/instrumentation/astra/async_astra.py +28 -5
- openlit/instrumentation/astra/utils.py +151 -55
- openlit/instrumentation/azure_ai_inference/__init__.py +43 -10
- openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +53 -21
- openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +53 -21
- openlit/instrumentation/azure_ai_inference/utils.py +307 -83
- openlit/instrumentation/bedrock/__init__.py +21 -4
- openlit/instrumentation/bedrock/bedrock.py +63 -25
- openlit/instrumentation/bedrock/utils.py +139 -30
- openlit/instrumentation/chroma/__init__.py +89 -16
- openlit/instrumentation/chroma/chroma.py +28 -6
- openlit/instrumentation/chroma/utils.py +167 -51
- openlit/instrumentation/cohere/__init__.py +63 -18
- openlit/instrumentation/cohere/async_cohere.py +63 -24
- openlit/instrumentation/cohere/cohere.py +63 -24
- openlit/instrumentation/cohere/utils.py +286 -73
- openlit/instrumentation/controlflow/__init__.py +35 -9
- openlit/instrumentation/controlflow/controlflow.py +66 -33
- openlit/instrumentation/crawl4ai/__init__.py +25 -10
- openlit/instrumentation/crawl4ai/async_crawl4ai.py +78 -31
- openlit/instrumentation/crawl4ai/crawl4ai.py +78 -31
- openlit/instrumentation/crewai/__init__.py +40 -15
- openlit/instrumentation/crewai/async_crewai.py +32 -7
- openlit/instrumentation/crewai/crewai.py +32 -7
- openlit/instrumentation/crewai/utils.py +159 -56
- openlit/instrumentation/dynamiq/__init__.py +46 -12
- openlit/instrumentation/dynamiq/dynamiq.py +74 -33
- openlit/instrumentation/elevenlabs/__init__.py +23 -4
- openlit/instrumentation/elevenlabs/async_elevenlabs.py +16 -4
- openlit/instrumentation/elevenlabs/elevenlabs.py +16 -4
- openlit/instrumentation/elevenlabs/utils.py +128 -25
- openlit/instrumentation/embedchain/__init__.py +11 -2
- openlit/instrumentation/embedchain/embedchain.py +68 -35
- openlit/instrumentation/firecrawl/__init__.py +24 -7
- openlit/instrumentation/firecrawl/firecrawl.py +46 -20
- openlit/instrumentation/google_ai_studio/__init__.py +45 -10
- openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +67 -44
- openlit/instrumentation/google_ai_studio/google_ai_studio.py +67 -44
- openlit/instrumentation/google_ai_studio/utils.py +180 -67
- openlit/instrumentation/gpt4all/__init__.py +22 -7
- openlit/instrumentation/gpt4all/gpt4all.py +67 -29
- openlit/instrumentation/gpt4all/utils.py +285 -61
- openlit/instrumentation/gpu/__init__.py +128 -47
- openlit/instrumentation/groq/__init__.py +21 -4
- openlit/instrumentation/groq/async_groq.py +33 -21
- openlit/instrumentation/groq/groq.py +33 -21
- openlit/instrumentation/groq/utils.py +192 -55
- openlit/instrumentation/haystack/__init__.py +70 -24
- openlit/instrumentation/haystack/async_haystack.py +28 -6
- openlit/instrumentation/haystack/haystack.py +28 -6
- openlit/instrumentation/haystack/utils.py +196 -74
- openlit/instrumentation/julep/__init__.py +69 -19
- openlit/instrumentation/julep/async_julep.py +53 -27
- openlit/instrumentation/julep/julep.py +53 -28
- openlit/instrumentation/langchain/__init__.py +74 -63
- openlit/instrumentation/langchain/callback_handler.py +1100 -0
- openlit/instrumentation/langchain_community/__init__.py +13 -2
- openlit/instrumentation/langchain_community/async_langchain_community.py +23 -5
- openlit/instrumentation/langchain_community/langchain_community.py +23 -5
- openlit/instrumentation/langchain_community/utils.py +35 -9
- openlit/instrumentation/letta/__init__.py +68 -15
- openlit/instrumentation/letta/letta.py +99 -54
- openlit/instrumentation/litellm/__init__.py +43 -14
- openlit/instrumentation/litellm/async_litellm.py +51 -26
- openlit/instrumentation/litellm/litellm.py +51 -26
- openlit/instrumentation/litellm/utils.py +304 -102
- openlit/instrumentation/llamaindex/__init__.py +267 -90
- openlit/instrumentation/llamaindex/async_llamaindex.py +28 -6
- openlit/instrumentation/llamaindex/llamaindex.py +28 -6
- openlit/instrumentation/llamaindex/utils.py +204 -91
- openlit/instrumentation/mem0/__init__.py +11 -2
- openlit/instrumentation/mem0/mem0.py +50 -29
- openlit/instrumentation/milvus/__init__.py +10 -2
- openlit/instrumentation/milvus/milvus.py +31 -6
- openlit/instrumentation/milvus/utils.py +166 -67
- openlit/instrumentation/mistral/__init__.py +63 -18
- openlit/instrumentation/mistral/async_mistral.py +63 -24
- openlit/instrumentation/mistral/mistral.py +63 -24
- openlit/instrumentation/mistral/utils.py +277 -69
- openlit/instrumentation/multion/__init__.py +69 -19
- openlit/instrumentation/multion/async_multion.py +57 -26
- openlit/instrumentation/multion/multion.py +57 -26
- openlit/instrumentation/ollama/__init__.py +39 -18
- openlit/instrumentation/ollama/async_ollama.py +57 -26
- openlit/instrumentation/ollama/ollama.py +57 -26
- openlit/instrumentation/ollama/utils.py +226 -50
- openlit/instrumentation/openai/__init__.py +156 -32
- openlit/instrumentation/openai/async_openai.py +147 -67
- openlit/instrumentation/openai/openai.py +150 -67
- openlit/instrumentation/openai/utils.py +657 -185
- openlit/instrumentation/openai_agents/__init__.py +5 -1
- openlit/instrumentation/openai_agents/processor.py +110 -90
- openlit/instrumentation/phidata/__init__.py +13 -5
- openlit/instrumentation/phidata/phidata.py +67 -32
- openlit/instrumentation/pinecone/__init__.py +48 -9
- openlit/instrumentation/pinecone/async_pinecone.py +27 -5
- openlit/instrumentation/pinecone/pinecone.py +27 -5
- openlit/instrumentation/pinecone/utils.py +153 -47
- openlit/instrumentation/premai/__init__.py +22 -7
- openlit/instrumentation/premai/premai.py +51 -26
- openlit/instrumentation/premai/utils.py +246 -59
- openlit/instrumentation/pydantic_ai/__init__.py +49 -22
- openlit/instrumentation/pydantic_ai/pydantic_ai.py +69 -16
- openlit/instrumentation/pydantic_ai/utils.py +89 -24
- openlit/instrumentation/qdrant/__init__.py +19 -4
- openlit/instrumentation/qdrant/async_qdrant.py +33 -7
- openlit/instrumentation/qdrant/qdrant.py +33 -7
- openlit/instrumentation/qdrant/utils.py +228 -93
- openlit/instrumentation/reka/__init__.py +23 -10
- openlit/instrumentation/reka/async_reka.py +17 -11
- openlit/instrumentation/reka/reka.py +17 -11
- openlit/instrumentation/reka/utils.py +138 -36
- openlit/instrumentation/together/__init__.py +44 -12
- openlit/instrumentation/together/async_together.py +50 -27
- openlit/instrumentation/together/together.py +50 -27
- openlit/instrumentation/together/utils.py +301 -71
- openlit/instrumentation/transformers/__init__.py +2 -1
- openlit/instrumentation/transformers/transformers.py +13 -3
- openlit/instrumentation/transformers/utils.py +139 -36
- openlit/instrumentation/vertexai/__init__.py +81 -16
- openlit/instrumentation/vertexai/async_vertexai.py +33 -15
- openlit/instrumentation/vertexai/utils.py +123 -27
- openlit/instrumentation/vertexai/vertexai.py +33 -15
- openlit/instrumentation/vllm/__init__.py +12 -5
- openlit/instrumentation/vllm/utils.py +121 -31
- openlit/instrumentation/vllm/vllm.py +16 -10
- openlit/otel/events.py +35 -10
- openlit/otel/metrics.py +32 -24
- openlit/otel/tracing.py +24 -9
- openlit/semcov/__init__.py +72 -6
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/METADATA +2 -1
- openlit-1.34.31.dist-info/RECORD +166 -0
- openlit/instrumentation/langchain/async_langchain.py +0 -102
- openlit/instrumentation/langchain/langchain.py +0 -102
- openlit/instrumentation/langchain/utils.py +0 -252
- openlit-1.34.30.dist-info/RECORD +0 -168
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/LICENSE +0 -0
- {openlit-1.34.30.dist-info → openlit-1.34.31.dist-info}/WHEEL +0 -0
--- a/openlit/instrumentation/gpt4all/gpt4all.py
+++ b/openlit/instrumentation/gpt4all/gpt4all.py
@@ -4,20 +4,26 @@ Module for monitoring GPT4All API calls.
 
 import time
 from opentelemetry.trace import SpanKind
-from openlit.__helpers import (
-    handle_exception,
-    set_server_address_and_port
-)
+from openlit.__helpers import handle_exception, set_server_address_and_port
 from openlit.instrumentation.gpt4all.utils import (
     process_generate_response,
     process_chunk,
     process_streaming_generate_response,
-    process_embedding_response
+    process_embedding_response,
 )
 from openlit.semcov import SemanticConvention
 
-def generate(version, environment, application_name,
-    tracer, pricing_info, capture_message_content, metrics, disable_metrics):
+
+def generate(
+    version,
+    environment,
+    application_name,
+    tracer,
+    pricing_info,
+    capture_message_content,
+    metrics,
+    disable_metrics,
+):
     """
     Generates a telemetry wrapper for GenAI function call
     """
@@ -28,16 +34,16 @@ def generate(version, environment, application_name,
     """
 
     def __init__(
-            self,
-            wrapped,
-            span,
-            span_name,
-            args,
-            kwargs,
-            server_address,
-            server_port,
-            request_model,
-        ):
+        self,
+        wrapped,
+        span,
+        span_name,
+        args,
+        kwargs,
+        server_address,
+        server_port,
+        request_model,
+    ):
         self.__wrapped__ = wrapped
         self._span = span
         self._span_name = span_name
@@ -75,7 +81,9 @@ def generate(version, environment, application_name,
             return chunk
         except StopIteration:
             try:
-                with tracer.start_as_current_span(self._span_name, kind=SpanKind.CLIENT) as self._span:
+                with tracer.start_as_current_span(
+                    self._span_name, kind=SpanKind.CLIENT
+                ) as self._span:
                     process_streaming_generate_response(
                         self,
                         pricing_info=pricing_info,
@@ -84,7 +92,7 @@ def generate(version, environment, application_name,
                         metrics=metrics,
                         capture_message_content=capture_message_content,
                         disable_metrics=disable_metrics,
-                        version=version
+                        version=version,
                     )
 
         except Exception as e:
@@ -100,8 +108,13 @@ def generate(version, environment, application_name,
        # Check if streaming is enabled for the API call
        streaming = kwargs.get("streaming", False)
 
-        server_address, server_port = set_server_address_and_port(instance, "127.0.0.1", 80)
-        request_model = str(instance.model.model_path).rsplit("/", maxsplit=1)[-1] or "orca-mini-3b-gguf2-q4_0.gguf"
+        server_address, server_port = set_server_address_and_port(
+            instance, "127.0.0.1", 80
+        )
+        request_model = (
+            str(instance.model.model_path).rsplit("/", maxsplit=1)[-1]
+            or "orca-mini-3b-gguf2-q4_0.gguf"
+        )
 
        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
 
@@ -109,7 +122,16 @@ def generate(version, environment, application_name,
            # Special handling for streaming response to accommodate the nature of data flow
            awaited_wrapped = wrapped(*args, **kwargs)
            span = tracer.start_span(span_name, kind=SpanKind.CLIENT)
-            return TracedSyncStream(awaited_wrapped, span, span_name, args, kwargs, server_address, server_port, request_model)
+            return TracedSyncStream(
+                awaited_wrapped,
+                span,
+                span_name,
+                args,
+                kwargs,
+                server_address,
+                server_port,
+                request_model,
+            )
 
        # Handling for non-streaming responses
        else:
@@ -133,7 +155,7 @@ def generate(version, environment, application_name,
                    kwargs=kwargs,
                    capture_message_content=capture_message_content,
                    disable_metrics=disable_metrics,
-                    version=version
+                    version=version,
                )
 
            except Exception as e:
@@ -143,8 +165,17 @@ def generate(version, environment, application_name,
 
    return wrapper
 
-def embed(version, environment, application_name,
-    tracer, pricing_info, capture_message_content, metrics, disable_metrics):
+
+def embed(
+    version,
+    environment,
+    application_name,
+    tracer,
+    pricing_info,
+    capture_message_content,
+    metrics,
+    disable_metrics,
+):
    """
    Generates a telemetry wrapper for GenAI function call
    """
@@ -154,10 +185,17 @@ def embed(version, environment, application_name,
        Wraps the GenAI function call.
        """
 
-        server_address, server_port = set_server_address_and_port(instance, "127.0.0.1", 80)
-        request_model = str(instance.gpt4all.model.model_path).rsplit("/", maxsplit=1)[-1] or "all-MiniLM-L6-v2.gguf2.f16.gguf"
+        server_address, server_port = set_server_address_and_port(
+            instance, "127.0.0.1", 80
+        )
+        request_model = (
+            str(instance.gpt4all.model.model_path).rsplit("/", maxsplit=1)[-1]
+            or "all-MiniLM-L6-v2.gguf2.f16.gguf"
+        )
 
-        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING} {request_model}"
+        span_name = (
+            f"{SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING} {request_model}"
+        )
 
        with tracer.start_as_current_span(span_name, kind=SpanKind.CLIENT) as span:
            start_time = time.time()
@@ -178,7 +216,7 @@ def embed(version, environment, application_name,
                    capture_message_content=capture_message_content,
                    disable_metrics=disable_metrics,
                    version=version,
-                    **kwargs
+                    **kwargs,
                )
 
            except Exception as e:

--- a/openlit/instrumentation/gpt4all/utils.py
+++ b/openlit/instrumentation/gpt4all/utils.py
@@ -1,9 +1,14 @@
 """
 GPT4All OpenTelemetry instrumentation utility functions
 """
+
 import time
 
-from opentelemetry.sdk.resources import SERVICE_NAME, TELEMETRY_SDK_NAME, DEPLOYMENT_ENVIRONMENT
+from opentelemetry.sdk.resources import (
+    SERVICE_NAME,
+    TELEMETRY_SDK_NAME,
+    DEPLOYMENT_ENVIRONMENT,
+)
 from opentelemetry.trace import Status, StatusCode
 
 from openlit.__helpers import (
@@ -16,12 +21,14 @@ from openlit.__helpers import (
 )
 from openlit.semcov import SemanticConvention
 
+
 def format_content(prompt):
     """
     Process a prompt to extract content.
     """
     return str(prompt) if prompt else ""
 
+
 def process_chunk(scope, chunk):
     """
     Process a chunk of response data and update state.
@@ -38,8 +45,22 @@ def process_chunk(scope, chunk):
        scope._llmresponse += chunk
        scope._end_time = time.time()
 
-def common_span_attributes(scope, gen_ai_operation, gen_ai_system, server_address,
-    server_port, request_model, response_model, environment, application_name, is_stream, tbt, ttft, version):
+
+def common_span_attributes(
+    scope,
+    gen_ai_operation,
+    gen_ai_system,
+    server_address,
+    server_port,
+    request_model,
+    response_model,
+    environment,
+    application_name,
+    is_stream,
+    tbt,
+    ttft,
+    version,
+):
    """
    Set common span attributes for both generate and embed operations.
    """
@@ -58,9 +79,25 @@ def common_span_attributes(scope, gen_ai_operation, gen_ai_system, server_address,
    scope._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT, ttft)
    scope._span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION, version)
 
-def record_completion_metrics(metrics, gen_ai_operation, gen_ai_system, server_address,
-    server_port, request_model, response_model, environment, application_name, start_time,
-    end_time, input_tokens, output_tokens, cost, tbt=None, ttft=None):
+
+def record_completion_metrics(
+    metrics,
+    gen_ai_operation,
+    gen_ai_system,
+    server_address,
+    server_port,
+    request_model,
+    response_model,
+    environment,
+    application_name,
+    start_time,
+    end_time,
+    input_tokens,
+    output_tokens,
+    cost,
+    tbt=None,
+    ttft=None,
+):
    """
    Record completion-specific metrics for the operation.
    """
@@ -79,16 +116,31 @@ def record_completion_metrics(metrics, gen_ai_operation, gen_ai_system, server_address,
    metrics["genai_requests"].add(1, attributes)
    metrics["genai_prompt_tokens"].add(input_tokens, attributes)
    metrics["genai_completion_tokens"].add(output_tokens, attributes)
-    metrics["genai_client_usage_tokens"].record(input_tokens + output_tokens, attributes)
+    metrics["genai_client_usage_tokens"].record(
+        input_tokens + output_tokens, attributes
+    )
    metrics["genai_cost"].record(cost, attributes)
    if tbt is not None:
        metrics["genai_server_tbt"].record(tbt, attributes)
    if ttft is not None:
        metrics["genai_server_ttft"].record(ttft, attributes)
 
-def record_embedding_metrics(metrics, gen_ai_operation, gen_ai_system, server_address,
-    server_port, request_model, response_model, environment, application_name, start_time,
-    end_time, input_tokens, cost):
+
+def record_embedding_metrics(
+    metrics,
+    gen_ai_operation,
+    gen_ai_system,
+    server_address,
+    server_port,
+    request_model,
+    response_model,
+    environment,
+    application_name,
+    start_time,
+    end_time,
+    input_tokens,
+    cost,
+):
    """
    Record embedding-specific metrics for the operation.
    """
@@ -109,8 +161,18 @@ def record_embedding_metrics(metrics, gen_ai_operation, gen_ai_system, server_address,
    metrics["genai_prompt_tokens"].add(input_tokens, attributes)
    metrics["genai_cost"].record(cost, attributes)
 
-def common_t2s_logic(scope, pricing_info, environment, application_name, metrics,
-    capture_message_content, disable_metrics, version, is_stream):
+
+def common_t2s_logic(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content,
+    disable_metrics,
+    version,
+    is_stream,
+):
    """
    Process generate request and generate Telemetry
    """
@@ -118,7 +180,9 @@ def common_t2s_logic(scope, pricing_info, environment, application_name, metrics,
    if len(scope._timestamps) > 1:
        scope._tbt = calculate_tbt(scope._timestamps)
 
-    prompt = format_content(scope._kwargs.get("prompt") or (scope._args[0] if scope._args else "") or "")
+    prompt = format_content(
+        scope._kwargs.get("prompt") or (scope._args[0] if scope._args else "") or ""
+    )
    request_model = scope._request_model
 
    # Calculate tokens using input prompt and aggregated response
@@ -128,36 +192,80 @@ def common_t2s_logic(scope, pricing_info, environment, application_name, metrics,
    cost = get_chat_model_cost(request_model, pricing_info, input_tokens, output_tokens)
 
    # Common Span Attributes
-    common_span_attributes(scope,
-        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_GPT4ALL,
-        scope._server_address, scope._server_port, request_model, request_model,
-        environment, application_name, is_stream, scope._tbt, scope._ttft, version)
+    common_span_attributes(
+        scope,
+        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+        SemanticConvention.GEN_AI_SYSTEM_GPT4ALL,
+        scope._server_address,
+        scope._server_port,
+        request_model,
+        request_model,
+        environment,
+        application_name,
+        is_stream,
+        scope._tbt,
+        scope._ttft,
+        version,
+    )
 
    # Span Attributes for Request parameters
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY, scope._kwargs.get("repeat_penalty", 1.18))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, scope._kwargs.get("max_tokens", 200))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY, scope._kwargs.get("presence_penalty", 0.0))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, scope._kwargs.get("temp", 0.7))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_P, scope._kwargs.get("top_p", 0.4))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_K, scope._kwargs.get("top_k", 40))
-    scope._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE, "text" if isinstance(scope._llmresponse, str) else "json")
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY,
+        scope._kwargs.get("repeat_penalty", 1.18),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS,
+        scope._kwargs.get("max_tokens", 200),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY,
+        scope._kwargs.get("presence_penalty", 0.0),
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, scope._kwargs.get("temp", 0.7)
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_TOP_P, scope._kwargs.get("top_p", 0.4)
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_REQUEST_TOP_K, scope._kwargs.get("top_k", 40)
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_OUTPUT_TYPE,
+        "text" if isinstance(scope._llmresponse, str) else "json",
+    )
 
    # Span Attributes for Cost and Tokens
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, input_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, output_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, input_tokens + output_tokens)
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, input_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, output_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, input_tokens + output_tokens
+    )
    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
 
    # Span Attributes for Tools
    if scope._tools:
-        scope._span.set_attribute(SemanticConvention.GEN_AI_TOOL_NAME, scope._tools.get("function", "")).get("name", "")
-        scope._span.set_attribute(SemanticConvention.GEN_AI_TOOL_CALL_ID, str(scope._tools.get("id", "")))
-        scope._span.set_attribute(SemanticConvention.GEN_AI_TOOL_ARGS, str(scope._tools.get("function", "").get("arguments", "")))
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_NAME, scope._tools.get("function", "")
+        ).get("name", "")
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_CALL_ID, str(scope._tools.get("id", ""))
+        )
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_TOOL_ARGS,
+            str(scope._tools.get("function", "").get("arguments", "")),
+        )
 
    # Span Attributes for Content
    if capture_message_content:
        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_PROMPT, prompt)
-        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse)
+        scope._span.set_attribute(
+            SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse
+        )
 
    # To be removed one the change to span_attributes (from span events) is complete
    scope._span.add_event(
@@ -177,13 +285,36 @@ def common_t2s_logic(scope, pricing_info, environment, application_name, metrics,
 
    # Metrics
    if not disable_metrics:
-        record_completion_metrics(metrics, SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT, SemanticConvention.GEN_AI_SYSTEM_GPT4ALL,
-            scope._server_address, scope._server_port, request_model, request_model, environment,
-            application_name, scope._start_time, scope._end_time, input_tokens, output_tokens,
-            cost, scope._tbt, scope._ttft)
+        record_completion_metrics(
+            metrics,
+            SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+            SemanticConvention.GEN_AI_SYSTEM_GPT4ALL,
+            scope._server_address,
+            scope._server_port,
+            request_model,
+            request_model,
+            environment,
+            application_name,
+            scope._start_time,
+            scope._end_time,
+            input_tokens,
+            output_tokens,
+            cost,
+            scope._tbt,
+            scope._ttft,
+        )
 
-def common_embedding_logic(scope, pricing_info, environment, application_name, metrics,
-    capture_message_content, disable_metrics, version):
+
+def common_embedding_logic(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content,
+    disable_metrics,
+    version,
+):
    """
    Process embedding request and generate Telemetry
    """
@@ -196,14 +327,29 @@ def common_embedding_logic(scope, pricing_info, environment, application_name, metrics,
    cost = get_embed_model_cost(request_model, pricing_info, input_tokens)
 
    # Common Span Attributes
-    common_span_attributes(scope,
-        SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING, SemanticConvention.GEN_AI_SYSTEM_GPT4ALL,
-        scope._server_address, scope._server_port, request_model, request_model,
-        environment, application_name, False, scope._tbt, scope._ttft, version)
+    common_span_attributes(
+        scope,
+        SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING,
+        SemanticConvention.GEN_AI_SYSTEM_GPT4ALL,
+        scope._server_address,
+        scope._server_port,
+        request_model,
+        request_model,
+        environment,
+        application_name,
+        False,
+        scope._tbt,
+        scope._ttft,
+        version,
+    )
 
    # Embedding-specific span attributes
-    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, input_tokens)
-    scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, input_tokens)
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, input_tokens
+    )
+    scope._span.set_attribute(
+        SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, input_tokens
+    )
    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
 
    # Span Attributes for Content
@@ -211,7 +357,9 @@ def common_embedding_logic(scope, pricing_info, environment, application_name, metrics,
        scope._span.add_event(
            name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
            attributes={
-                SemanticConvention.GEN_AI_CONTENT_PROMPT: str(scope._kwargs.get("input", "")),
+                SemanticConvention.GEN_AI_CONTENT_PROMPT: str(
+                    scope._kwargs.get("input", "")
+                ),
            },
        )
 
@@ -219,21 +367,66 @@ def common_embedding_logic(scope, pricing_info, environment, application_name, metrics,
 
    # Metrics
    if not disable_metrics:
-        record_embedding_metrics(metrics, SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING, SemanticConvention.GEN_AI_SYSTEM_GPT4ALL,
-            scope._server_address, scope._server_port, request_model, request_model, environment,
-            application_name, scope._start_time, scope._end_time, input_tokens, cost)
+        record_embedding_metrics(
+            metrics,
+            SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING,
+            SemanticConvention.GEN_AI_SYSTEM_GPT4ALL,
+            scope._server_address,
+            scope._server_port,
+            request_model,
+            request_model,
+            environment,
+            application_name,
+            scope._start_time,
+            scope._end_time,
+            input_tokens,
+            cost,
+        )
 
-def process_streaming_generate_response(scope, pricing_info, environment, application_name,
-    metrics, capture_message_content=False, disable_metrics=False, version=""):
+
+def process_streaming_generate_response(
+    scope,
+    pricing_info,
+    environment,
+    application_name,
+    metrics,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="",
+):
    """
    Process generate request and generate Telemetry
    """
-    common_t2s_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version, is_stream=True)
+    common_t2s_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+        is_stream=True,
+    )
 
-def process_generate_response(response, request_model, pricing_info, server_port, server_address,
-    environment, application_name, metrics, start_time, span, args, kwargs,
-    capture_message_content=False, disable_metrics=False, version="1.0.0"):
+
+def process_generate_response(
+    response,
+    request_model,
+    pricing_info,
+    server_port,
+    server_address,
+    environment,
+    application_name,
+    metrics,
+    start_time,
+    span,
+    args,
+    kwargs,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="1.0.0",
+):
    """
    Process generate request and generate Telemetry
    """
@@ -252,14 +445,37 @@ def process_generate_response(response, request_model, pricing_info, server_port,
    scope._args = args
    scope._tools = None
 
-    common_t2s_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version, is_stream=False)
+    common_t2s_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+        is_stream=False,
+    )
 
    return response
 
-def process_embedding_response(response, request_model, pricing_info, server_port, server_address,
-    environment, application_name, metrics, start_time, span,
-    capture_message_content=False, disable_metrics=False, version="1.0.0", **kwargs):
+
+def process_embedding_response(
+    response,
+    request_model,
+    pricing_info,
+    server_port,
+    server_address,
+    environment,
+    application_name,
+    metrics,
+    start_time,
+    span,
+    capture_message_content=False,
+    disable_metrics=False,
+    version="1.0.0",
+    **kwargs,
+):
    """
    Process embedding request and generate Telemetry
    """
@@ -275,7 +491,15 @@ def process_embedding_response(response, request_model, pricing_info, server_port,
    scope._server_address, scope._server_port = server_address, server_port
    scope._kwargs = kwargs
 
-    common_embedding_logic(scope, pricing_info, environment, application_name, metrics,
-        capture_message_content, disable_metrics, version)
+    common_embedding_logic(
+        scope,
+        pricing_info,
+        environment,
+        application_name,
+        metrics,
+        capture_message_content,
+        disable_metrics,
+        version,
+    )
 
    return response