openlit 1.33.19__py3-none-any.whl → 1.33.21__py3-none-any.whl
This diff compares the contents of two publicly released versions of the package as published to a supported registry. It is provided for informational purposes only and reflects the packages exactly as they appear in their public registries.
- openlit/__helpers.py +64 -7
- openlit/__init__.py +3 -3
- openlit/evals/utils.py +7 -7
- openlit/guard/utils.py +7 -7
- openlit/instrumentation/ag2/ag2.py +24 -24
- openlit/instrumentation/ai21/ai21.py +3 -3
- openlit/instrumentation/ai21/async_ai21.py +3 -3
- openlit/instrumentation/ai21/utils.py +59 -59
- openlit/instrumentation/anthropic/anthropic.py +2 -2
- openlit/instrumentation/anthropic/async_anthropic.py +2 -2
- openlit/instrumentation/anthropic/utils.py +34 -34
- openlit/instrumentation/assemblyai/assemblyai.py +24 -24
- openlit/instrumentation/astra/astra.py +3 -3
- openlit/instrumentation/astra/async_astra.py +3 -3
- openlit/instrumentation/astra/utils.py +39 -39
- openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +2 -2
- openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +2 -2
- openlit/instrumentation/azure_ai_inference/utils.py +36 -36
- openlit/instrumentation/bedrock/bedrock.py +2 -2
- openlit/instrumentation/bedrock/utils.py +35 -35
- openlit/instrumentation/chroma/chroma.py +57 -57
- openlit/instrumentation/cohere/async_cohere.py +88 -88
- openlit/instrumentation/cohere/cohere.py +88 -88
- openlit/instrumentation/controlflow/controlflow.py +15 -15
- openlit/instrumentation/crawl4ai/async_crawl4ai.py +14 -14
- openlit/instrumentation/crawl4ai/crawl4ai.py +14 -14
- openlit/instrumentation/crewai/crewai.py +22 -22
- openlit/instrumentation/dynamiq/dynamiq.py +19 -19
- openlit/instrumentation/elevenlabs/async_elevenlabs.py +24 -25
- openlit/instrumentation/elevenlabs/elevenlabs.py +23 -25
- openlit/instrumentation/embedchain/embedchain.py +15 -15
- openlit/instrumentation/firecrawl/firecrawl.py +10 -10
- openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +33 -33
- openlit/instrumentation/google_ai_studio/google_ai_studio.py +33 -33
- openlit/instrumentation/gpt4all/gpt4all.py +78 -78
- openlit/instrumentation/gpu/__init__.py +8 -8
- openlit/instrumentation/groq/async_groq.py +74 -74
- openlit/instrumentation/groq/groq.py +74 -74
- openlit/instrumentation/haystack/haystack.py +6 -6
- openlit/instrumentation/julep/async_julep.py +14 -14
- openlit/instrumentation/julep/julep.py +14 -14
- openlit/instrumentation/langchain/async_langchain.py +39 -39
- openlit/instrumentation/langchain/langchain.py +39 -39
- openlit/instrumentation/letta/letta.py +26 -26
- openlit/instrumentation/litellm/async_litellm.py +94 -94
- openlit/instrumentation/litellm/litellm.py +94 -94
- openlit/instrumentation/llamaindex/llamaindex.py +7 -7
- openlit/instrumentation/mem0/mem0.py +13 -13
- openlit/instrumentation/milvus/milvus.py +47 -47
- openlit/instrumentation/mistral/async_mistral.py +88 -88
- openlit/instrumentation/mistral/mistral.py +88 -88
- openlit/instrumentation/multion/async_multion.py +21 -21
- openlit/instrumentation/multion/multion.py +21 -21
- openlit/instrumentation/ollama/__init__.py +47 -34
- openlit/instrumentation/ollama/async_ollama.py +7 -5
- openlit/instrumentation/ollama/ollama.py +7 -5
- openlit/instrumentation/ollama/utils.py +58 -54
- openlit/instrumentation/openai/async_openai.py +225 -225
- openlit/instrumentation/openai/openai.py +225 -225
- openlit/instrumentation/openai_agents/openai_agents.py +11 -11
- openlit/instrumentation/phidata/phidata.py +15 -15
- openlit/instrumentation/pinecone/pinecone.py +43 -43
- openlit/instrumentation/premai/premai.py +86 -86
- openlit/instrumentation/qdrant/async_qdrant.py +95 -95
- openlit/instrumentation/qdrant/qdrant.py +99 -99
- openlit/instrumentation/reka/async_reka.py +33 -33
- openlit/instrumentation/reka/reka.py +33 -33
- openlit/instrumentation/together/async_together.py +90 -90
- openlit/instrumentation/together/together.py +90 -90
- openlit/instrumentation/transformers/__init__.py +11 -7
- openlit/instrumentation/transformers/transformers.py +32 -168
- openlit/instrumentation/transformers/utils.py +183 -0
- openlit/instrumentation/vertexai/async_vertexai.py +64 -64
- openlit/instrumentation/vertexai/vertexai.py +64 -64
- openlit/instrumentation/vllm/vllm.py +24 -24
- openlit/otel/metrics.py +11 -11
- openlit/semcov/__init__.py +3 -3
- {openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/METADATA +8 -8
- openlit-1.33.21.dist-info/RECORD +132 -0
- {openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/WHEEL +1 -1
- openlit-1.33.19.dist-info/RECORD +0 -131
- {openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/LICENSE +0 -0
openlit/instrumentation/transformers/utils.py (new file):

```diff
--- /dev/null
+++ openlit/instrumentation/transformers/utils.py
@@ -0,0 +1,183 @@
+"""
+HF Transformers OpenTelemetry instrumentation utility functions
+"""
+import time
+
+from opentelemetry.sdk.resources import SERVICE_NAME, TELEMETRY_SDK_NAME, DEPLOYMENT_ENVIRONMENT
+from opentelemetry.trace import Status, StatusCode
+
+from openlit.__helpers import (
+    response_as_dict,
+    calculate_tbt,
+    general_tokens,
+    get_chat_model_cost,
+    create_metrics_attributes,
+    format_and_concatenate
+)
+from openlit.semcov import SemanticConvention
+
+def common_chat_logic(scope, pricing_info, environment, application_name, metrics,
+    capture_message_content, disable_metrics, version, args, kwargs, is_stream):
+
+    """
+    Process chat request and generate Telemetry
+    """
+
+    scope._end_time = time.time()
+    if len(scope._timestamps) > 1:
+        scope._tbt = calculate_tbt(scope._timestamps)
+
+    forward_params = scope._instance._forward_params
+    request_model = scope._instance.model.config.name_or_path
+
+    input_tokens = general_tokens(scope._prompt)
+    output_tokens = general_tokens(scope._llmresponse)
+
+    cost = get_chat_model_cost(request_model, pricing_info, input_tokens, output_tokens)
+
+    # Set Span attributes (OTel Semconv)
+    scope._span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
+    scope._span.set_attribute(SemanticConvention.GEN_AI_OPERATION, SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_SYSTEM, SemanticConvention.GEN_AI_SYSTEM_HUGGING_FACE)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL, request_model)
+    scope._span.set_attribute(SemanticConvention.SERVER_PORT, scope._server_port)
+
+    # List of attributes and their config keys
+    attributes = [
+        (SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, "temperature"),
+        (SemanticConvention.GEN_AI_REQUEST_TOP_K, "top_k"),
+        (SemanticConvention.GEN_AI_REQUEST_TOP_P, "top_p"),
+        (SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, "max_length"),
+    ]
+
+    # Set each attribute if the corresponding value exists and is not None
+    for attribute, key in attributes:
+        value = forward_params.get(key)
+        if value is not None:
+            scope._span.set_attribute(attribute, value)
+
+    scope._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL, request_model)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS, input_tokens)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS, output_tokens)
+    scope._span.set_attribute(SemanticConvention.SERVER_ADDRESS, scope._server_address)
+    scope._span.set_attribute(DEPLOYMENT_ENVIRONMENT, environment)
+    scope._span.set_attribute(SERVICE_NAME, application_name)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM, is_stream)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_CLIENT_TOKEN_USAGE, input_tokens + output_tokens)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST, cost)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TBT, scope._tbt)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT, scope._ttft)
+    scope._span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION, version)
+
+    # To be removed one the change to span_attributes (from span events) is complete
+    if capture_message_content:
+        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_PROMPT, scope._prompt)
+        scope._span.set_attribute(SemanticConvention.GEN_AI_CONTENT_COMPLETION, scope._llmresponse,)
+
+        scope._span.add_event(
+            name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
+            attributes={
+                SemanticConvention.GEN_AI_CONTENT_PROMPT: scope._prompt,
+            },
+        )
+        scope._span.add_event(
+            name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
+            attributes={
+                SemanticConvention.GEN_AI_CONTENT_COMPLETION: scope._llmresponse,
+            },
+        )
+
+    scope._span.set_status(Status(StatusCode.OK))
+
+    if not disable_metrics:
+        metrics_attributes = create_metrics_attributes(
+            service_name=application_name,
+            deployment_environment=environment,
+            operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+            system=SemanticConvention.GEN_AI_SYSTEM_HUGGING_FACE,
+            request_model=request_model,
+            server_address=scope._server_address,
+            server_port=scope._server_port,
+            response_model=request_model,
+        )
+
+        metrics["genai_client_usage_tokens"].record(input_tokens + output_tokens, metrics_attributes)
+        metrics["genai_client_operation_duration"].record(scope._end_time - scope._start_time, metrics_attributes)
+        metrics["genai_server_tbt"].record(scope._tbt, metrics_attributes)
+        metrics["genai_server_ttft"].record(scope._ttft, metrics_attributes)
+        metrics["genai_requests"].add(1, metrics_attributes)
+        metrics["genai_completion_tokens"].add(output_tokens, metrics_attributes)
+        metrics["genai_prompt_tokens"].add(input_tokens, metrics_attributes)
+        metrics["genai_cost"].record(cost, metrics_attributes)
+
+def process_chat_response(instance, response, request_model, pricing_info, server_port, server_address,
+    environment, application_name, metrics, start_time,
+    span, args, kwargs, capture_message_content=False, disable_metrics=False, version="1.0.0"):
+    """
+    Process chat request and generate Telemetry
+    """
+
+    self = type("GenericScope", (), {})()
+    response_dict = response_as_dict(response)
+
+    # pylint: disable = no-member
+    self._instance = instance
+    self._start_time = start_time
+    self._end_time = time.time()
+    self._span = span
+    self._timestamps = []
+    self._ttft, self._tbt = self._end_time - self._start_time, 0
+    self._server_address, self._server_port = server_address, server_port
+    self._kwargs = kwargs
+    self._args = args
+
+    if self._args and len(self._args) > 0:
+        self._prompt = args[0]
+    else:
+        self._prompt = (
+            kwargs.get("text_inputs") or
+            (kwargs.get("image") and kwargs.get("question") and
+             ("image: " + kwargs.get("image") + " question:" + kwargs.get("question"))) or
+            kwargs.get("fallback") or
+            ""
+        )
+    self._prompt = format_and_concatenate(self._prompt)
+
+    self._llmresponse = []
+    if self._kwargs.get("task", "text-generation") == "text-generation":
+        first_entry = response_dict[0]
+
+        if isinstance(first_entry, dict) and isinstance(first_entry.get("generated_text"), list):
+            last_element = first_entry.get("generated_text")[-1]
+            self._llmresponse = last_element.get("content", last_element)
+        else:
+            def extract_text(entry):
+                if isinstance(entry, dict):
+                    return entry.get("generated_text")
+                if isinstance(entry, list):
+                    return " ".join(
+                        extract_text(sub_entry) for sub_entry in entry if isinstance(sub_entry, dict)
+                    )
+                return ""
+
+            # Process and collect all generated texts
+            self._llmresponse = [
+                extract_text(entry) for entry in response_dict
+            ]
+
+            # Join all non-empty responses into a single string
+            self._llmresponse = " ".join(filter(None, self._llmresponse))
+
+    elif self._kwargs.get("task", "text-generation") == "automatic-speech-recognition":
+        self._llmresponse = response_dict.get("text", "")
+
+    elif self._kwargs.get("task", "text-generation") == "image-classification":
+        self._llmresponse = str(response_dict[0])
+
+    elif self._kwargs.get("task", "text-generation") == "visual-question-answering":
+        self._llmresponse = str(response_dict[0]).get("answer")
+
+    common_chat_logic(self, pricing_info, environment, application_name, metrics,
+        capture_message_content, disable_metrics, version, args, kwargs, is_stream=False)
+
+    return response
```
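This new module centralizes the span and metric logic that previously lived inline in `transformers.py` (note the matching `transformers/transformers.py +32 -168` entry in the file list). For orientation, here is a minimal sketch of how the module gets exercised, assuming `openlit` and `transformers` are installed and a small local model such as `gpt2` can be loaded. User code never calls `process_chat_response` directly; openlit's transformers instrumentor wraps the pipeline invocation and routes it through these helpers:

```python
# Minimal sketch (assumptions: openlit + transformers installed, "gpt2"
# downloadable). openlit patches the transformers pipeline call, so the
# invocation below is what ultimately flows through process_chat_response().
import openlit
from transformers import pipeline

openlit.init(application_name="demo-app", environment="dev")

generator = pipeline("text-generation", model="gpt2")
# max_length is one of the forward params common_chat_logic() reads back
# onto the span as gen_ai.request.max_tokens.
result = generator("OpenTelemetry makes LLM apps observable because", max_length=32)

# The instrumentation records the span (model, tokens, cost, TTFT/TBT) and,
# unless disabled, the genai_* metrics shown in common_chat_logic().
print(result[0]["generated_text"])
```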
openlit/instrumentation/vertexai/async_vertexai.py (representative of the rename applied across the instrumentation modules; the removed lines carry the legacy `SemanticConvetion` spelling):

```diff
@@ -13,7 +13,7 @@ from openlit.__helpers import (
     calculate_tbt,
     create_metrics_attributes,
 )
-from openlit.semcov import SemanticConvetion
+from openlit.semcov import SemanticConvention
 
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
@@ -139,26 +139,26 @@ def async_send_message(version, environment, application_name, tracer,
 
         # Set Span attributes (OTel Semconv)
         self._span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-        self._span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+        self._span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+        self._span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                SemanticConvention.GEN_AI_SYSTEM_VERTEXAI)
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                 self._request_model)
-        self._span.set_attribute(SemanticConvetion.SERVER_PORT,
+        self._span.set_attribute(SemanticConvention.SERVER_PORT,
                                 self._server_port)
 
         inference_config = self._kwargs.get('generation_config', {})
 
         # List of attributes and their config keys
         attributes = [
-            (SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
-            (SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
-            (SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
-            (SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
-            (SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
-            (SemanticConvetion.GEN_AI_REQUEST_TOP_P, 'top_p'),
-            (SemanticConvetion.GEN_AI_REQUEST_TOP_K, 'top_k'),
+            (SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
+            (SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
+            (SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
+            (SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
+            (SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
+            (SemanticConvention.GEN_AI_REQUEST_TOP_P, 'top_p'),
+            (SemanticConvention.GEN_AI_REQUEST_TOP_K, 'top_k'),
         ]
 
         # Set each attribute if the corresponding value exists and is not None
@@ -168,19 +168,19 @@ def async_send_message(version, environment, application_name, tracer,
             if value is not None:
                 self._span.set_attribute(attribute, value)
 
-        self._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+        self._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                 self._request_model)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+        self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                 self._input_tokens)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+        self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                                 self._output_tokens)
-        self._span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+        self._span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                 self._server_address)
         if isinstance(self._llmresponse, str):
-            self._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+            self._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                 "text")
         else:
-            self._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+            self._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                 "json")
 
         # Set Span attributes (Extra)
@@ -188,29 +188,29 @@ def async_send_message(version, environment, application_name, tracer,
                                 environment)
         self._span.set_attribute(SERVICE_NAME,
                                 application_name)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                                 True)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+        self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                 self._input_tokens + self._output_tokens)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+        self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                 cost)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TBT,
+        self._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TBT,
                                 self._tbt)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+        self._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                                 self._ttft)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+        self._span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                 version)
         if capture_message_content:
             self._span.add_event(
-                name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                 attributes={
-                    SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                    SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
                 },
             )
             self._span.add_event(
-                name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                 attributes={
-                    SemanticConvetion.GEN_AI_CONTENT_COMPLETION: self._llmresponse,
+                    SemanticConvention.GEN_AI_CONTENT_COMPLETION: self._llmresponse,
                 },
             )
             self._span.set_status(Status(StatusCode.OK))
@@ -219,8 +219,8 @@ def async_send_message(version, environment, application_name, tracer,
             attributes = create_metrics_attributes(
                 service_name=application_name,
                 deployment_environment=environment,
-                operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-                system=SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI,
+                operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+                system=SemanticConvention.GEN_AI_SYSTEM_VERTEXAI,
                 request_model=self._request_model,
                 server_address=self._server_address,
                 server_port=self._server_port,
@@ -280,7 +280,7 @@ def async_send_message(version, environment, application_name, tracer,
 
     server_address, server_port = location + '-aiplatform.googleapis.com', 443
 
-    span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+    span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
 
     # pylint: disable=no-else-return
     if streaming:
@@ -342,26 +342,26 @@ def async_send_message(version, environment, application_name, tracer,
 
             # Set base span attribues (OTel Semconv)
             span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-            span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-            span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI)
-            span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+            span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+            span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                SemanticConvention.GEN_AI_SYSTEM_VERTEXAI)
+            span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                 request_model)
-            span.set_attribute(SemanticConvetion.SERVER_PORT,
+            span.set_attribute(SemanticConvention.SERVER_PORT,
                                 server_port)
 
             inference_config = kwargs.get('generation_config', {})
 
             # List of attributes and their config keys
             attributes = [
-                (SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
-                (SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
-                (SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
-                (SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
-                (SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
-                (SemanticConvetion.GEN_AI_REQUEST_TOP_P, 'top_p'),
-                (SemanticConvetion.GEN_AI_REQUEST_TOP_K, 'top_k'),
+                (SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
+                (SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
+                (SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
+                (SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
+                (SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
+                (SemanticConvention.GEN_AI_REQUEST_TOP_P, 'top_p'),
+                (SemanticConvention.GEN_AI_REQUEST_TOP_K, 'top_k'),
             ]
 
             # Set each attribute if the corresponding value exists and is not None
@@ -371,15 +371,15 @@ def async_send_message(version, environment, application_name, tracer,
                 if value is not None:
                     span.set_attribute(attribute, value)
 
-            span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+            span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                 request_model)
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+            span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                 input_tokens)
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+            span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                                 output_tokens)
-            span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+            span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                 server_address)
-            # span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_FINISH_REASON,
+            # span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON,
             # [str(response.candidates[0].finish_reason)])
 
             # Set base span attribues (Extras)
@@ -387,35 +387,35 @@ def async_send_message(version, environment, application_name, tracer,
                                 environment)
             span.set_attribute(SERVICE_NAME,
                                 application_name)
-            span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+            span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                                 False)
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+            span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                 input_tokens + output_tokens)
-            span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+            span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                 cost)
-            span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+            span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                                 end_time - start_time)
-            span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+            span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                 version)
             if capture_message_content:
                 span.add_event(
-                    name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                    name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                     attributes={
-                        SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                        SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
                     },
                 )
                 span.add_event(
-                    name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                    name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                     attributes={
-                        SemanticConvetion.GEN_AI_CONTENT_COMPLETION: response.text,
+                        SemanticConvention.GEN_AI_CONTENT_COMPLETION: response.text,
                     },
                 )
 
             if isinstance(response.text, str):
-                span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                     "text")
             elif response.text is not None:
-                span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                     "json")
 
             span.set_status(Status(StatusCode.OK))
@@ -424,8 +424,8 @@ def async_send_message(version, environment, application_name, tracer,
             attributes = create_metrics_attributes(
                 service_name=application_name,
                 deployment_environment=environment,
-                operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-                system=SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI,
+                operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+                system=SemanticConvention.GEN_AI_SYSTEM_VERTEXAI,
                 request_model=request_model,
                 server_address=server_address,
                 server_port=server_port,
```
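These vertexai hunks, like the symmetric ±N counts on most other files in the list above, boil down to one mechanical change: the class exported by `openlit.semcov` is now spelled `SemanticConvention`. Downstream code that imported the class directly can bridge both spellings with a small shim; this is a sketch under the assumption that older releases exported only the legacy name, so feature-detect rather than pinning a version:

```python
# Sketch of a dual-spelling import shim for code that uses openlit.semcov
# directly (assumption: pre-rename releases only export the legacy name).
from opentelemetry import trace

try:
    from openlit.semcov import SemanticConvention  # current spelling
except ImportError:
    from openlit.semcov import SemanticConvetion as SemanticConvention  # legacy spelling

tracer = trace.get_tracer(__name__)
with tracer.start_as_current_span("chat example") as span:
    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL, "gemini-1.5-pro")
```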