openlit 1.33.19__py3-none-any.whl → 1.33.21__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (82)
  1. openlit/__helpers.py +64 -7
  2. openlit/__init__.py +3 -3
  3. openlit/evals/utils.py +7 -7
  4. openlit/guard/utils.py +7 -7
  5. openlit/instrumentation/ag2/ag2.py +24 -24
  6. openlit/instrumentation/ai21/ai21.py +3 -3
  7. openlit/instrumentation/ai21/async_ai21.py +3 -3
  8. openlit/instrumentation/ai21/utils.py +59 -59
  9. openlit/instrumentation/anthropic/anthropic.py +2 -2
  10. openlit/instrumentation/anthropic/async_anthropic.py +2 -2
  11. openlit/instrumentation/anthropic/utils.py +34 -34
  12. openlit/instrumentation/assemblyai/assemblyai.py +24 -24
  13. openlit/instrumentation/astra/astra.py +3 -3
  14. openlit/instrumentation/astra/async_astra.py +3 -3
  15. openlit/instrumentation/astra/utils.py +39 -39
  16. openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +2 -2
  17. openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +2 -2
  18. openlit/instrumentation/azure_ai_inference/utils.py +36 -36
  19. openlit/instrumentation/bedrock/bedrock.py +2 -2
  20. openlit/instrumentation/bedrock/utils.py +35 -35
  21. openlit/instrumentation/chroma/chroma.py +57 -57
  22. openlit/instrumentation/cohere/async_cohere.py +88 -88
  23. openlit/instrumentation/cohere/cohere.py +88 -88
  24. openlit/instrumentation/controlflow/controlflow.py +15 -15
  25. openlit/instrumentation/crawl4ai/async_crawl4ai.py +14 -14
  26. openlit/instrumentation/crawl4ai/crawl4ai.py +14 -14
  27. openlit/instrumentation/crewai/crewai.py +22 -22
  28. openlit/instrumentation/dynamiq/dynamiq.py +19 -19
  29. openlit/instrumentation/elevenlabs/async_elevenlabs.py +24 -25
  30. openlit/instrumentation/elevenlabs/elevenlabs.py +23 -25
  31. openlit/instrumentation/embedchain/embedchain.py +15 -15
  32. openlit/instrumentation/firecrawl/firecrawl.py +10 -10
  33. openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +33 -33
  34. openlit/instrumentation/google_ai_studio/google_ai_studio.py +33 -33
  35. openlit/instrumentation/gpt4all/gpt4all.py +78 -78
  36. openlit/instrumentation/gpu/__init__.py +8 -8
  37. openlit/instrumentation/groq/async_groq.py +74 -74
  38. openlit/instrumentation/groq/groq.py +74 -74
  39. openlit/instrumentation/haystack/haystack.py +6 -6
  40. openlit/instrumentation/julep/async_julep.py +14 -14
  41. openlit/instrumentation/julep/julep.py +14 -14
  42. openlit/instrumentation/langchain/async_langchain.py +39 -39
  43. openlit/instrumentation/langchain/langchain.py +39 -39
  44. openlit/instrumentation/letta/letta.py +26 -26
  45. openlit/instrumentation/litellm/async_litellm.py +94 -94
  46. openlit/instrumentation/litellm/litellm.py +94 -94
  47. openlit/instrumentation/llamaindex/llamaindex.py +7 -7
  48. openlit/instrumentation/mem0/mem0.py +13 -13
  49. openlit/instrumentation/milvus/milvus.py +47 -47
  50. openlit/instrumentation/mistral/async_mistral.py +88 -88
  51. openlit/instrumentation/mistral/mistral.py +88 -88
  52. openlit/instrumentation/multion/async_multion.py +21 -21
  53. openlit/instrumentation/multion/multion.py +21 -21
  54. openlit/instrumentation/ollama/__init__.py +47 -34
  55. openlit/instrumentation/ollama/async_ollama.py +7 -5
  56. openlit/instrumentation/ollama/ollama.py +7 -5
  57. openlit/instrumentation/ollama/utils.py +58 -54
  58. openlit/instrumentation/openai/async_openai.py +225 -225
  59. openlit/instrumentation/openai/openai.py +225 -225
  60. openlit/instrumentation/openai_agents/openai_agents.py +11 -11
  61. openlit/instrumentation/phidata/phidata.py +15 -15
  62. openlit/instrumentation/pinecone/pinecone.py +43 -43
  63. openlit/instrumentation/premai/premai.py +86 -86
  64. openlit/instrumentation/qdrant/async_qdrant.py +95 -95
  65. openlit/instrumentation/qdrant/qdrant.py +99 -99
  66. openlit/instrumentation/reka/async_reka.py +33 -33
  67. openlit/instrumentation/reka/reka.py +33 -33
  68. openlit/instrumentation/together/async_together.py +90 -90
  69. openlit/instrumentation/together/together.py +90 -90
  70. openlit/instrumentation/transformers/__init__.py +11 -7
  71. openlit/instrumentation/transformers/transformers.py +32 -168
  72. openlit/instrumentation/transformers/utils.py +183 -0
  73. openlit/instrumentation/vertexai/async_vertexai.py +64 -64
  74. openlit/instrumentation/vertexai/vertexai.py +64 -64
  75. openlit/instrumentation/vllm/vllm.py +24 -24
  76. openlit/otel/metrics.py +11 -11
  77. openlit/semcov/__init__.py +3 -3
  78. {openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/METADATA +8 -8
  79. openlit-1.33.21.dist-info/RECORD +132 -0
  80. {openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/WHEEL +1 -1
  81. openlit-1.33.19.dist-info/RECORD +0 -131
  82. {openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/LICENSE +0 -0

openlit/instrumentation/ollama/__init__.py
@@ -16,6 +16,29 @@ from openlit.instrumentation.ollama.async_ollama import (
 
 _instruments = ("ollama >= 0.2.0",)
 
+# Dispatch wrapper to route instrumentation to chat or embeddings based on path
+def _dispatch(sync_chat_wrap, sync_emb_wrap):
+    def wrapper(wrapped, instance, args, kwargs):
+        if len(args) > 2 and isinstance(args[2], str):
+            op = args[2].rstrip("/").split("/")[-1]
+            if op == "chat":
+                return sync_chat_wrap(wrapped, instance, args, kwargs)
+            if op == "embeddings":
+                return sync_emb_wrap(wrapped, instance, args, kwargs)
+        return wrapped(*args, **kwargs)
+    return wrapper
+
+def _dispatch_async(async_chat_wrap, async_emb_wrap):
+    async def wrapper(wrapped, instance, args, kwargs):
+        if len(args) > 2 and isinstance(args[2], str):
+            op = args[2].rstrip("/").split("/")[-1]
+            if op == "chat":
+                return await async_chat_wrap(wrapped, instance, args, kwargs)
+            if op == "embeddings":
+                return await async_emb_wrap(wrapped, instance, args, kwargs)
+        return await wrapped(*args, **kwargs)
+    return wrapper
+
 class OllamaInstrumentor(BaseInstrumentor):
     """
     An instrumentor for Ollama's client library.
@@ -35,48 +58,38 @@ class OllamaInstrumentor(BaseInstrumentor):
         disable_metrics = kwargs.get("disable_metrics")
         version = importlib.metadata.version("ollama")
 
-        # sync chat
-        wrap_function_wrapper(
-            "ollama",
-            "chat",
-            chat(version, environment, application_name,
-                 tracer, event_provider, pricing_info, capture_message_content, metrics, disable_metrics),
+        # Build wrapper factories for chat and embeddings
+        sync_chat_wrap = chat(
+            version, environment, application_name,
+            tracer, event_provider, pricing_info,
+            capture_message_content, metrics, disable_metrics
         )
-        wrap_function_wrapper(
-            "ollama",
-            "Client.chat",
-            chat(version, environment, application_name,
-                 tracer, event_provider, pricing_info, capture_message_content, metrics, disable_metrics),
+        sync_emb_wrap = embeddings(
+            version, environment, application_name,
+            tracer, event_provider, pricing_info,
+            capture_message_content, metrics, disable_metrics
         )
-
-        # sync embeddings
-        wrap_function_wrapper(
-            "ollama",
-            "embeddings",
-            embeddings(version, environment, application_name,
-                 tracer, event_provider, pricing_info, capture_message_content, metrics, disable_metrics),
+        async_chat_wrap = async_chat(
+            version, environment, application_name,
+            tracer, event_provider, pricing_info,
+            capture_message_content, metrics, disable_metrics
        )
-        wrap_function_wrapper(
-            "ollama",
-            "Client.embeddings",
-            embeddings(version, environment, application_name,
-                 tracer, event_provider, pricing_info, capture_message_content, metrics, disable_metrics),
+        async_emb_wrap = async_embeddings(
+            version, environment, application_name,
+            tracer, event_provider, pricing_info,
+            capture_message_content, metrics, disable_metrics
        )
 
-        # async chat
+        # Patch underlying request methods to ensure instrumentation regardless of import order
         wrap_function_wrapper(
-            "ollama",
-            "AsyncClient.chat",
-            async_chat(version, environment, application_name,
-                 tracer, event_provider, pricing_info, capture_message_content, metrics, disable_metrics),
+            "ollama._client",
+            "Client._request",
+            _dispatch(sync_chat_wrap, sync_emb_wrap),
         )
-
-        # async embeddings
         wrap_function_wrapper(
-            "ollama",
-            "AsyncClient.embeddings",
-            async_embeddings(version, environment, application_name,
-                 tracer, event_provider, pricing_info, capture_message_content, metrics, disable_metrics),
+            "ollama._client",
+            "AsyncClient._request",
+            _dispatch_async(async_chat_wrap, async_emb_wrap),
         )
 
     def _uninstrument(self, **kwargs):
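
Why this refactor matters: the public ollama.chat / ollama.embeddings entry points delegate to Client._request, so wrapping that single transport method (and its AsyncClient twin) covers module-level calls, client instances, and aliases in one place, regardless of import order. Below is a minimal, self-contained sketch of the same wrapt pattern; the Api class, its _request signature, and the print harness are stand-ins for illustration, not the real ollama client:

import sys
import wrapt

class Api:
    # stand-in for ollama's Client; positional args after self are (cls, method, path)
    def _request(self, cls, method, path, **kwargs):
        return f"raw {method} {path}"

def chat_wrap(wrapped, instance, args, kwargs):
    return "chat-instrumented: " + wrapped(*args, **kwargs)

def emb_wrap(wrapped, instance, args, kwargs):
    return "embeddings-instrumented: " + wrapped(*args, **kwargs)

def _dispatch(chat_wrap, emb_wrap):
    def wrapper(wrapped, instance, args, kwargs):
        # args[2] is the URL path; route on its last segment
        if len(args) > 2 and isinstance(args[2], str):
            op = args[2].rstrip("/").split("/")[-1]
            if op == "chat":
                return chat_wrap(wrapped, instance, args, kwargs)
            if op == "embeddings":
                return emb_wrap(wrapped, instance, args, kwargs)
        return wrapped(*args, **kwargs)  # everything else passes through untouched
    return wrapper

wrapt.wrap_function_wrapper(sys.modules[__name__], "Api._request",
                            _dispatch(chat_wrap, emb_wrap))

api = Api()
print(api._request(dict, "POST", "/api/chat"))        # chat-instrumented: raw POST /api/chat
print(api._request(dict, "POST", "/api/embeddings"))  # embeddings-instrumented: raw POST /api/embeddings
print(api._request(dict, "GET", "/api/tags"))         # raw GET /api/tags

The trade-off: the wrappers now receive transport-level kwargs (the json= payload) instead of the user-facing model=/messages= keywords, which is exactly what the json_body fallbacks in the hunks below compensate for.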

openlit/instrumentation/ollama/async_ollama.py
@@ -15,7 +15,7 @@ from openlit.instrumentation.ollama.utils import (
     process_streaming_chat_response,
     process_embedding_response
 )
-from openlit.semcov import SemanticConvetion
+from openlit.semcov import SemanticConvention
 
 logger = logging.getLogger(__name__)
 
@@ -106,9 +106,10 @@ def async_chat(version, environment, application_name,
        streaming = kwargs.get("stream", False)
 
        server_address, server_port = set_server_address_and_port(instance, "127.0.0.1", 11434)
-        request_model = kwargs.get("model", "gpt-4o")
+        json_body = kwargs.get("json", {}) or {}
+        request_model = json_body.get("model") or kwargs.get("model")
 
-        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
 
        # pylint: disable=no-else-return
        if streaming:
@@ -154,9 +155,10 @@ def async_embeddings(version, environment, application_name,
        """
 
        server_address, server_port = set_server_address_and_port(instance, '127.0.0.1', 11434)
-        request_model = kwargs.get('model', 'all-minilm')
+        json_body = kwargs.get('json', {}) or {}
+        request_model = json_body.get('model') or kwargs.get('model')
 
-        span_name = f'{SemanticConvetion.GEN_AI_OPERATION_TYPE_EMBEDDING} {request_model}'
+        span_name = f'{SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING} {request_model}'
 
        with tracer.start_as_current_span(span_name, kind= SpanKind.CLIENT) as span:
            start_time = time.time()
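
Since the wrapper now sees the raw request, the model name is read from the json= payload first, with the old keyword lookup kept as a fallback; the hard-coded "gpt-4o" / "all-minilm" defaults, which were wrong for Ollama anyway, are gone, so an unknown model now surfaces as None rather than a plausible-but-false name. A hedged sketch of just this lookup (resolve_model is a name invented here for illustration):

def resolve_model(kwargs):
    # `or {}` also guards against an explicit json=None reaching _request
    json_body = kwargs.get("json", {}) or {}
    return json_body.get("model") or kwargs.get("model")

print(resolve_model({"json": {"model": "llama3.2", "messages": []}}))  # llama3.2
print(resolve_model({"model": "all-minilm"}))                          # all-minilm
print(resolve_model({"json": None}))                                   # None

The sync chat/embeddings hunks below apply the identical change, and utils.py extends the same json-first pattern to the chat messages and the embedding prompt.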

openlit/instrumentation/ollama/ollama.py
@@ -15,7 +15,7 @@ from openlit.instrumentation.ollama.utils import (
     process_streaming_chat_response,
     process_embedding_response
 )
-from openlit.semcov import SemanticConvetion
+from openlit.semcov import SemanticConvention
 
 logger = logging.getLogger(__name__)
 
@@ -106,9 +106,10 @@ def chat(version, environment, application_name,
        streaming = kwargs.get("stream", False)
 
        server_address, server_port = set_server_address_and_port(instance, "127.0.0.1", 11434)
-        request_model = kwargs.get("model", "gpt-4o")
+        json_body = kwargs.get("json", {}) or {}
+        request_model = json_body.get("model") or kwargs.get("model")
 
-        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
 
        # pylint: disable=no-else-return
        if streaming:
@@ -154,9 +155,10 @@ def embeddings(version, environment, application_name,
        """
 
        server_address, server_port = set_server_address_and_port(instance, '127.0.0.1', 11434)
-        request_model = kwargs.get('model', 'all-minilm')
+        json_body = kwargs.get('json', {}) or {}
+        request_model = json_body.get('model') or kwargs.get('model')
 
-        span_name = f'{SemanticConvetion.GEN_AI_OPERATION_TYPE_EMBEDDING} {request_model}'
+        span_name = f'{SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING} {request_model}'
 
        with tracer.start_as_current_span(span_name, kind= SpanKind.CLIENT) as span:
            start_time = time.time()

openlit/instrumentation/ollama/utils.py
@@ -19,7 +19,7 @@ from openlit.__helpers import (
     otel_event,
     concatenate_all_contents
 )
-from openlit.semcov import SemanticConvetion
+from openlit.semcov import SemanticConvention
 
 def process_chunk(self, chunk):
     """
@@ -57,27 +57,29 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
     if len(scope._timestamps) > 1:
         scope._tbt = calculate_tbt(scope._timestamps)
 
-    formatted_messages = extract_and_format_input(scope._kwargs.get("messages", ""))
-    request_model = scope._kwargs.get("model", "gpt-4o")
+    json_body = scope._kwargs.get("json", {}) or {}
+    request_model = json_body.get("model") or scope._kwargs.get("model")
+    messages = json_body.get("messages", scope._kwargs.get("messages", ""))
+    formatted_messages = extract_and_format_input(messages)
 
     cost = get_chat_model_cost(request_model, pricing_info, scope._input_tokens, scope._output_tokens)
 
     # Set Span attributes (OTel Semconv)
     scope._span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_OPERATION, SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM, SemanticConvetion.GEN_AI_SYSTEM_OLLAMA)
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL, request_model)
-    scope._span.set_attribute(SemanticConvetion.SERVER_PORT, scope._server_port)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_OPERATION, SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_SYSTEM, SemanticConvention.GEN_AI_SYSTEM_OLLAMA)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL, request_model)
+    scope._span.set_attribute(SemanticConvention.SERVER_PORT, scope._server_port)
 
     options = scope._kwargs.get('options', {})
     attributes = [
-        (SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'repeat_penalty'),
-        (SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS, 'max_tokens'),
-        (SemanticConvetion.GEN_AI_REQUEST_SEED, 'seed'),
-        (SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop'),
-        (SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
-        (SemanticConvetion.GEN_AI_REQUEST_TOP_P, 'top_p'),
-        (SemanticConvetion.GEN_AI_REQUEST_TOP_K, 'top_k'),
+        (SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'repeat_penalty'),
+        (SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, 'max_tokens'),
+        (SemanticConvention.GEN_AI_REQUEST_SEED, 'seed'),
+        (SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop'),
+        (SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
+        (SemanticConvention.GEN_AI_REQUEST_TOP_P, 'top_p'),
+        (SemanticConvention.GEN_AI_REQUEST_TOP_K, 'top_k'),
     ]
 
     for attribute, key in attributes:
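
The attribute list above (its loop body continues in the next hunk) maps Ollama's options dict onto span attributes only when a given option is actually present. A minimal sketch with a plain dict standing in for the OTel span; the gen_ai.* strings are the values these constants are assumed to hold under the OTel GenAI semantic conventions:

options = {"temperature": 0.7, "top_k": 40, "stop": ["###"]}
attributes = [
    ("gen_ai.request.temperature", "temperature"),
    ("gen_ai.request.top_p", "top_p"),            # absent from options, so skipped
    ("gen_ai.request.top_k", "top_k"),
    ("gen_ai.request.stop_sequences", "stop"),
]
span = {}  # stands in for scope._span.set_attribute
for attribute, key in attributes:
    value = options.get(key)
    if value is not None:
        span[attribute] = value
print(span)
# {'gen_ai.request.temperature': 0.7, 'gen_ai.request.top_k': 40, 'gen_ai.request.stop_sequences': ['###']}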
@@ -85,37 +87,37 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
         if value is not None:
             scope._span.set_attribute(attribute, value)
 
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_FINISH_REASON, [scope._finish_reason])
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL, scope._response_model)
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens)
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens)
-    scope._span.set_attribute(SemanticConvetion.SERVER_ADDRESS, scope._server_address)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON, [scope._finish_reason])
+    scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL, scope._response_model)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, scope._input_tokens)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, scope._output_tokens)
+    scope._span.set_attribute(SemanticConvention.SERVER_ADDRESS, scope._server_address)
 
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+    scope._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                               "text" if isinstance(scope._llmresponse, str) else "json")
 
     scope._span.set_attribute(DEPLOYMENT_ENVIRONMENT, environment)
     scope._span.set_attribute(SERVICE_NAME, application_name)
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM, is_stream)
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_CLIENT_TOKEN_USAGE, scope._input_tokens + scope._output_tokens)
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST, cost)
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TBT, scope._tbt)
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT, scope._ttft)
-    scope._span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION, version)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM, is_stream)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, scope._input_tokens + scope._output_tokens)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TBT, scope._tbt)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT, scope._ttft)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION, version)
 
     # To be removed one the change to log events (from span events) is complete
     prompt = concatenate_all_contents(formatted_messages)
     if capture_message_content:
         scope._span.add_event(
-            name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+            name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
             attributes={
-                SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
             },
         )
         scope._span.add_event(
-            name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+            name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
             attributes={
-                SemanticConvetion.GEN_AI_CONTENT_COMPLETION: scope._llmresponse,
+                SemanticConvention.GEN_AI_CONTENT_COMPLETION: scope._llmresponse,
             },
         )
 
@@ -145,9 +147,9 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
     for role in ['user', 'system', 'assistant', 'tool']:
         if formatted_messages.get(role, {}).get('content', ''):
             event = otel_event(
-                name=getattr(SemanticConvetion, f'GEN_AI_{role.upper()}_MESSAGE'),
+                name=getattr(SemanticConvention, f'GEN_AI_{role.upper()}_MESSAGE'),
                 attributes={
-                    SemanticConvetion.GEN_AI_SYSTEM: SemanticConvetion.GEN_AI_SYSTEM_OLLAMA
+                    SemanticConvention.GEN_AI_SYSTEM: SemanticConvention.GEN_AI_SYSTEM_OLLAMA
                 },
                 body = {
                     # pylint: disable=line-too-long
@@ -172,9 +174,9 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
             event_provider.emit(event)
 
     choice_event = otel_event(
-        name=SemanticConvetion.GEN_AI_CHOICE,
+        name=SemanticConvention.GEN_AI_CHOICE,
         attributes={
-            SemanticConvetion.GEN_AI_SYSTEM: SemanticConvetion.GEN_AI_SYSTEM_OLLAMA
+            SemanticConvention.GEN_AI_SYSTEM: SemanticConvention.GEN_AI_SYSTEM_OLLAMA
         },
         body=choice_event_body
     )
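
The per-role loop above derives each event name with getattr instead of four separate branches: the role string 'user' becomes the constant GEN_AI_USER_MESSAGE, and so on. A sketch with a stand-in constants class (values assumed to follow the OTel GenAI event names; the real constants live in openlit.semcov.SemanticConvention):

class SemanticConvention:
    GEN_AI_USER_MESSAGE = "gen_ai.user.message"
    GEN_AI_SYSTEM_MESSAGE = "gen_ai.system.message"
    GEN_AI_ASSISTANT_MESSAGE = "gen_ai.assistant.message"
    GEN_AI_TOOL_MESSAGE = "gen_ai.tool.message"

for role in ["user", "system", "assistant", "tool"]:
    print(getattr(SemanticConvention, f"GEN_AI_{role.upper()}_MESSAGE"))

This is also why the class rename in this release had to be mechanical and complete: a stale SemanticConvetion reference inside a function body fails only when that code path runs, not at import time.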
@@ -186,8 +188,8 @@ def common_chat_logic(scope, pricing_info, environment, application_name, metric
     metrics_attributes = create_metrics_attributes(
         service_name=application_name,
         deployment_environment=environment,
-        operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-        system=SemanticConvetion.GEN_AI_SYSTEM_OLLAMA,
+        operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+        system=SemanticConvention.GEN_AI_SYSTEM_OLLAMA,
         request_model=request_model,
         server_address=scope._server_address,
         server_port=scope._server_port,
@@ -252,7 +254,9 @@ def process_embedding_response(response, request_model, pricing_info, server_por
     end_time = time.time()
 
     try:
-        input_tokens = general_tokens(str(kwargs.get('prompt')))
+        json_body = kwargs.get("json", {}) or {}
+        prompt_val = json_body.get('prompt', kwargs.get('prompt', ''))
+        input_tokens = general_tokens(str(prompt_val))
 
         # Calculate cost of the operation
         cost = get_embed_model_cost(request_model,
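
The embeddings path gets the same json-first treatment for its prompt, and prompt_val is reused further down for the captured message content, keeping the token count and the recorded prompt consistent. A sketch; general_tokens here is a crude whitespace counter standing in for openlit's real helper:

def general_tokens(text):
    # stand-in tokenizer for illustration; openlit's helper is more precise
    return len(text.split())

def embedding_input_tokens(kwargs):
    json_body = kwargs.get("json", {}) or {}
    prompt_val = json_body.get('prompt', kwargs.get('prompt', ''))
    return general_tokens(str(prompt_val))

print(embedding_input_tokens({"json": {"prompt": "embed these four words"}}))  # 4
print(embedding_input_tokens({"prompt": "legacy keyword path"}))               # 3

Note the new code also fixes a quiet bug in the removed line: str(kwargs.get('prompt')) rendered a missing prompt as the literal string 'None' and counted its tokens, whereas the fallback now defaults to ''.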
@@ -260,19 +264,19 @@
 
         # Set Span attributes (OTel Semconv)
         span.set_attribute(TELEMETRY_SDK_NAME, 'openlit')
-        span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                           SemanticConvetion.GEN_AI_OPERATION_TYPE_EMBEDDING)
-        span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                           SemanticConvetion.GEN_AI_SYSTEM_OLLAMA)
-        span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+        span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                           SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING)
+        span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                           SemanticConvention.GEN_AI_SYSTEM_OLLAMA)
+        span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                            request_model)
-        span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+        span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                            request_model)
-        span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+        span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                            server_address)
-        span.set_attribute(SemanticConvetion.SERVER_PORT,
+        span.set_attribute(SemanticConvention.SERVER_PORT,
                            server_port)
-        span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+        span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                            input_tokens)
 
         # Set Span attributes (Extras)
@@ -280,20 +284,20 @@ def process_embedding_response(response, request_model, pricing_info, server_por
                            environment)
         span.set_attribute(SERVICE_NAME,
                            application_name)
-        span.set_attribute(SemanticConvetion.GEN_AI_CLIENT_TOKEN_USAGE,
+        span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE,
                            input_tokens)
-        span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+        span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                            cost)
-        span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+        span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                            version)
 
         prompt_event = otel_event(
-            name=SemanticConvetion.GEN_AI_USER_MESSAGE,
+            name=SemanticConvention.GEN_AI_USER_MESSAGE,
             attributes={
-                SemanticConvetion.GEN_AI_SYSTEM: SemanticConvetion.GEN_AI_SYSTEM_OLLAMA
+                SemanticConvention.GEN_AI_SYSTEM: SemanticConvention.GEN_AI_SYSTEM_OLLAMA
             },
             body={
-                **({"content": kwargs.get('prompt', '')} if capture_message_content else {}),
+                **({"content": prompt_val} if capture_message_content else {}),
                 "role": 'user'
             }
         )
@@ -305,8 +309,8 @@
         attributes = create_metrics_attributes(
             service_name=application_name,
             deployment_environment=environment,
-            operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_EMBEDDING,
-            system=SemanticConvetion.GEN_AI_SYSTEM_OLLAMA,
+            operation=SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING,
+            system=SemanticConvention.GEN_AI_SYSTEM_OLLAMA,
             request_model=request_model,
             server_address=server_address,
             server_port=server_port,