PyPI - openlit - Versions diffs - 1.33.19__py3-none-any.whl → 1.33.20__py3-none-any.whl - Mend

openlit-1.33.19-py3-none-any.whl → openlit-1.33.20-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (79)

openlit/__helpers.py +7 -7
openlit/__init__.py +3 -3
openlit/evals/utils.py +7 -7
openlit/guard/utils.py +7 -7
openlit/instrumentation/ag2/ag2.py +24 -24
openlit/instrumentation/ai21/ai21.py +3 -3
openlit/instrumentation/ai21/async_ai21.py +3 -3
openlit/instrumentation/ai21/utils.py +59 -59
openlit/instrumentation/anthropic/anthropic.py +2 -2
openlit/instrumentation/anthropic/async_anthropic.py +2 -2
openlit/instrumentation/anthropic/utils.py +34 -34
openlit/instrumentation/assemblyai/assemblyai.py +24 -24
openlit/instrumentation/astra/astra.py +3 -3
openlit/instrumentation/astra/async_astra.py +3 -3
openlit/instrumentation/astra/utils.py +39 -39
openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +2 -2
openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +2 -2
openlit/instrumentation/azure_ai_inference/utils.py +36 -36
openlit/instrumentation/bedrock/bedrock.py +2 -2
openlit/instrumentation/bedrock/utils.py +35 -35
openlit/instrumentation/chroma/chroma.py +57 -57
openlit/instrumentation/cohere/async_cohere.py +88 -88
openlit/instrumentation/cohere/cohere.py +88 -88
openlit/instrumentation/controlflow/controlflow.py +15 -15
openlit/instrumentation/crawl4ai/async_crawl4ai.py +14 -14
openlit/instrumentation/crawl4ai/crawl4ai.py +14 -14
openlit/instrumentation/crewai/crewai.py +22 -22
openlit/instrumentation/dynamiq/dynamiq.py +19 -19
openlit/instrumentation/elevenlabs/async_elevenlabs.py +24 -25
openlit/instrumentation/elevenlabs/elevenlabs.py +23 -25
openlit/instrumentation/embedchain/embedchain.py +15 -15
openlit/instrumentation/firecrawl/firecrawl.py +10 -10
openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +33 -33
openlit/instrumentation/google_ai_studio/google_ai_studio.py +33 -33
openlit/instrumentation/gpt4all/gpt4all.py +78 -78
openlit/instrumentation/gpu/__init__.py +8 -8
openlit/instrumentation/groq/async_groq.py +74 -74
openlit/instrumentation/groq/groq.py +74 -74
openlit/instrumentation/haystack/haystack.py +6 -6
openlit/instrumentation/julep/async_julep.py +14 -14
openlit/instrumentation/julep/julep.py +14 -14
openlit/instrumentation/langchain/async_langchain.py +39 -39
openlit/instrumentation/langchain/langchain.py +39 -39
openlit/instrumentation/letta/letta.py +26 -26
openlit/instrumentation/litellm/async_litellm.py +94 -94
openlit/instrumentation/litellm/litellm.py +94 -94
openlit/instrumentation/llamaindex/llamaindex.py +7 -7
openlit/instrumentation/mem0/mem0.py +13 -13
openlit/instrumentation/milvus/milvus.py +47 -47
openlit/instrumentation/mistral/async_mistral.py +88 -88
openlit/instrumentation/mistral/mistral.py +88 -88
openlit/instrumentation/multion/async_multion.py +21 -21
openlit/instrumentation/multion/multion.py +21 -21
openlit/instrumentation/ollama/async_ollama.py +3 -3
openlit/instrumentation/ollama/ollama.py +3 -3
openlit/instrumentation/ollama/utils.py +50 -50
openlit/instrumentation/openai/async_openai.py +225 -225
openlit/instrumentation/openai/openai.py +225 -225
openlit/instrumentation/openai_agents/openai_agents.py +11 -11
openlit/instrumentation/phidata/phidata.py +15 -15
openlit/instrumentation/pinecone/pinecone.py +43 -43
openlit/instrumentation/premai/premai.py +86 -86
openlit/instrumentation/qdrant/async_qdrant.py +95 -95
openlit/instrumentation/qdrant/qdrant.py +99 -99
openlit/instrumentation/reka/async_reka.py +33 -33
openlit/instrumentation/reka/reka.py +33 -33
openlit/instrumentation/together/async_together.py +90 -90
openlit/instrumentation/together/together.py +90 -90
openlit/instrumentation/transformers/transformers.py +26 -26
openlit/instrumentation/vertexai/async_vertexai.py +64 -64
openlit/instrumentation/vertexai/vertexai.py +64 -64
openlit/instrumentation/vllm/vllm.py +24 -24
openlit/otel/metrics.py +11 -11
openlit/semcov/__init__.py +3 -3
{openlit-1.33.19.dist-info → openlit-1.33.20.dist-info}/METADATA +8 -8
openlit-1.33.20.dist-info/RECORD +131 -0
{openlit-1.33.19.dist-info → openlit-1.33.20.dist-info}/WHEEL +1 -1
openlit-1.33.19.dist-info/RECORD +0 -131
{openlit-1.33.19.dist-info → openlit-1.33.20.dist-info}/LICENSE +0 -0

openlit/instrumentation/vertexai/async_vertexai.py CHANGED Viewed

@@ -13,7 +13,7 @@ from openlit.__helpers import (
     calculate_tbt,
     create_metrics_attributes,
 )
-from openlit.semcov import SemanticConvetion
+from openlit.semcov import SemanticConvention
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
@@ -139,26 +139,26 @@ def async_send_message(version, environment, application_name, tracer,
                     # Set Span attributes (OTel Semconv)
                     self._span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                        SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                        SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                        SemanticConvention.GEN_AI_SYSTEM_VERTEXAI)
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                         self._request_model)
-                    self._span.set_attribute(SemanticConvetion.SERVER_PORT,
+                    self._span.set_attribute(SemanticConvention.SERVER_PORT,
                                         self._server_port)
                     inference_config = self._kwargs.get('generation_config', {})
                     # List of attributes and their config keys
                     attributes = [
-                        (SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
-                        (SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
-                        (SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
-                        (SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TOP_P, 'top_p'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TOP_K, 'top_k'),
+                        (SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
+                        (SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
+                        (SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
+                        (SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
+                        (SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
+                        (SemanticConvention.GEN_AI_REQUEST_TOP_P, 'top_p'),
+                        (SemanticConvention.GEN_AI_REQUEST_TOP_K, 'top_k'),
                     ]
                     # Set each attribute if the corresponding value exists and is not None
@@ -168,19 +168,19 @@ def async_send_message(version, environment, application_name, tracer,
                         if value is not None:
                             self._span.set_attribute(attribute, value)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                         self._request_model)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                         self._input_tokens)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                                         self._output_tokens)
-                    self._span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                    self._span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                         self._server_address)
                     if isinstance(self._llmresponse, str):
-                        self._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                        self._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                         "text")
                     else:
-                        self._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                        self._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                         "json")
                     # Set Span attributes (Extra)
@@ -188,29 +188,29 @@ def async_send_message(version, environment, application_name, tracer,
                                         environment)
                     self._span.set_attribute(SERVICE_NAME,
                                         application_name)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                                         True)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                         self._input_tokens + self._output_tokens)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                         cost)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TBT,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TBT,
                                         self._tbt)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                                         self._ttft)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                         version)
                     if capture_message_content:
                         self._span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                                SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
                             },
                         )
                         self._span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_COMPLETION: self._llmresponse,
+                                SemanticConvention.GEN_AI_CONTENT_COMPLETION: self._llmresponse,
                             },
                         )
                     self._span.set_status(Status(StatusCode.OK))
@@ -219,8 +219,8 @@ def async_send_message(version, environment, application_name, tracer,
                         attributes = create_metrics_attributes(
                             service_name=application_name,
                             deployment_environment=environment,
-                            operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-                            system=SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI,
+                            operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+                            system=SemanticConvention.GEN_AI_SYSTEM_VERTEXAI,
                             request_model=self._request_model,
                             server_address=self._server_address,
                             server_port=self._server_port,
@@ -280,7 +280,7 @@ def async_send_message(version, environment, application_name, tracer,
         server_address, server_port = location + '-aiplatform.googleapis.com', 443
-        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
         # pylint: disable=no-else-return
         if streaming:
@@ -342,26 +342,26 @@ def async_send_message(version, environment, application_name, tracer,
                     # Set base span attribues (OTel Semconv)
                     span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-                    span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                        SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-                    span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                        SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI)
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+                    span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+                    span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                        SemanticConvention.GEN_AI_SYSTEM_VERTEXAI)
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                         request_model)
-                    span.set_attribute(SemanticConvetion.SERVER_PORT,
+                    span.set_attribute(SemanticConvention.SERVER_PORT,
                                         server_port)
                     inference_config = kwargs.get('generation_config', {})
                     # List of attributes and their config keys
                     attributes = [
-                        (SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
-                        (SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
-                        (SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
-                        (SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TOP_P, 'top_p'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TOP_K, 'top_k'),
+                        (SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
+                        (SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
+                        (SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
+                        (SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
+                        (SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
+                        (SemanticConvention.GEN_AI_REQUEST_TOP_P, 'top_p'),
+                        (SemanticConvention.GEN_AI_REQUEST_TOP_K, 'top_k'),
                     ]
                     # Set each attribute if the corresponding value exists and is not None
@@ -371,15 +371,15 @@ def async_send_message(version, environment, application_name, tracer,
                         if value is not None:
                             span.set_attribute(attribute, value)
-                    span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                    span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                         request_model)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                         input_tokens)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                                         output_tokens)
-                    span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                    span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                         server_address)
-                    # span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_FINISH_REASON,
+                    # span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON,
                     #                     [str(response.candidates[0].finish_reason)])
                     # Set base span attribues (Extras)
@@ -387,35 +387,35 @@ def async_send_message(version, environment, application_name, tracer,
                                         environment)
                     span.set_attribute(SERVICE_NAME,
                                         application_name)
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                                         False)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                         input_tokens + output_tokens)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                         cost)
-                    span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+                    span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                                         end_time - start_time)
-                    span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                    span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                         version)
                     if capture_message_content:
                         span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                                SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
                             },
                         )
                         span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_COMPLETION: response.text,
+                                SemanticConvention.GEN_AI_CONTENT_COMPLETION: response.text,
                             },
                         )
                         if isinstance(response.text, str):
-                            span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                            span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                             "text")
                         elif response.text is not None:
-                            span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                            span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                             "json")
                     span.set_status(Status(StatusCode.OK))
@@ -424,8 +424,8 @@ def async_send_message(version, environment, application_name, tracer,
                         attributes = create_metrics_attributes(
                             service_name=application_name,
                             deployment_environment=environment,
-                            operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-                            system=SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI,
+                            operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+                            system=SemanticConvention.GEN_AI_SYSTEM_VERTEXAI,
                             request_model=request_model,
                             server_address=server_address,
                             server_port=server_port,

openlit/instrumentation/vertexai/vertexai.py CHANGED Viewed

@@ -13,7 +13,7 @@ from openlit.__helpers import (
     calculate_tbt,
     create_metrics_attributes,
 )
-from openlit.semcov import SemanticConvetion
+from openlit.semcov import SemanticConvention
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
@@ -139,26 +139,26 @@ def send_message(version, environment, application_name, tracer,
                     # Set Span attributes (OTel Semconv)
                     self._span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                        SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                        SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                        SemanticConvention.GEN_AI_SYSTEM_VERTEXAI)
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                         self._request_model)
-                    self._span.set_attribute(SemanticConvetion.SERVER_PORT,
+                    self._span.set_attribute(SemanticConvention.SERVER_PORT,
                                         self._server_port)
                     inference_config = self._kwargs.get('generation_config', {})
                     # List of attributes and their config keys
                     attributes = [
-                        (SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
-                        (SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
-                        (SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
-                        (SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TOP_P, 'top_p'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TOP_K, 'top_k'),
+                        (SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
+                        (SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
+                        (SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
+                        (SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
+                        (SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
+                        (SemanticConvention.GEN_AI_REQUEST_TOP_P, 'top_p'),
+                        (SemanticConvention.GEN_AI_REQUEST_TOP_K, 'top_k'),
                     ]
                     # Set each attribute if the corresponding value exists and is not None
@@ -168,19 +168,19 @@ def send_message(version, environment, application_name, tracer,
                         if value is not None:
                             self._span.set_attribute(attribute, value)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                         self._request_model)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                         self._input_tokens)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                                         self._output_tokens)
-                    self._span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                    self._span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                         self._server_address)
                     if isinstance(self._llmresponse, str):
-                        self._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                        self._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                         "text")
                     else:
-                        self._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                        self._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                         "json")
                     # Set Span attributes (Extra)
@@ -188,29 +188,29 @@ def send_message(version, environment, application_name, tracer,
                                         environment)
                     self._span.set_attribute(SERVICE_NAME,
                                         application_name)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                                         True)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                         self._input_tokens + self._output_tokens)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                         cost)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TBT,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TBT,
                                         self._tbt)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                                         self._ttft)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                         version)
                     if capture_message_content:
                         self._span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                                SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
                             },
                         )
                         self._span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_COMPLETION: self._llmresponse,
+                                SemanticConvention.GEN_AI_CONTENT_COMPLETION: self._llmresponse,
                             },
                         )
                     self._span.set_status(Status(StatusCode.OK))
@@ -219,8 +219,8 @@ def send_message(version, environment, application_name, tracer,
                         attributes = create_metrics_attributes(
                             service_name=application_name,
                             deployment_environment=environment,
-                            operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-                            system=SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI,
+                            operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+                            system=SemanticConvention.GEN_AI_SYSTEM_VERTEXAI,
                             request_model=self._request_model,
                             server_address=self._server_address,
                             server_port=self._server_port,
@@ -280,7 +280,7 @@ def send_message(version, environment, application_name, tracer,
         server_address, server_port = location + '-aiplatform.googleapis.com', 443
-        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
         # pylint: disable=no-else-return
         if streaming:
@@ -342,26 +342,26 @@ def send_message(version, environment, application_name, tracer,
                     # Set base span attribues (OTel Semconv)
                     span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-                    span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                        SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-                    span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                        SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI)
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+                    span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+                    span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                        SemanticConvention.GEN_AI_SYSTEM_VERTEXAI)
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                         request_model)
-                    span.set_attribute(SemanticConvetion.SERVER_PORT,
+                    span.set_attribute(SemanticConvention.SERVER_PORT,
                                         server_port)
                     inference_config = kwargs.get('generation_config', {})
                     # List of attributes and their config keys
                     attributes = [
-                        (SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
-                        (SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
-                        (SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
-                        (SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TOP_P, 'top_p'),
-                        (SemanticConvetion.GEN_AI_REQUEST_TOP_K, 'top_k'),
+                        (SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
+                        (SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, 'max_output_tokens'),
+                        (SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
+                        (SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
+                        (SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
+                        (SemanticConvention.GEN_AI_REQUEST_TOP_P, 'top_p'),
+                        (SemanticConvention.GEN_AI_REQUEST_TOP_K, 'top_k'),
                     ]
                     # Set each attribute if the corresponding value exists and is not None
@@ -371,15 +371,15 @@ def send_message(version, environment, application_name, tracer,
                         if value is not None:
                             span.set_attribute(attribute, value)
-                    span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                    span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                         request_model)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                         input_tokens)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                                         output_tokens)
-                    span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                    span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                         server_address)
-                    # span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_FINISH_REASON,
+                    # span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON,
                     #                     [str(response.candidates[0].finish_reason)])
                     # Set base span attribues (Extras)
@@ -387,35 +387,35 @@ def send_message(version, environment, application_name, tracer,
                                         environment)
                     span.set_attribute(SERVICE_NAME,
                                         application_name)
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                                         False)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                         input_tokens + output_tokens)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                         cost)
-                    span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+                    span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                                         end_time - start_time)
-                    span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                    span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                         version)
                     if capture_message_content:
                         span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                                SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
                             },
                         )
                         span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_COMPLETION: response.text,
+                                SemanticConvention.GEN_AI_CONTENT_COMPLETION: response.text,
                             },
                         )
                         if isinstance(response.text, str):
-                            span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                            span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                             "text")
                         elif response.text is not None:
-                            span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                            span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                             "json")
                     span.set_status(Status(StatusCode.OK))
@@ -424,8 +424,8 @@ def send_message(version, environment, application_name, tracer,
                         attributes = create_metrics_attributes(
                             service_name=application_name,
                             deployment_environment=environment,
-                            operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-                            system=SemanticConvetion.GEN_AI_SYSTEM_VERTEXAI,
+                            operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+                            system=SemanticConvention.GEN_AI_SYSTEM_VERTEXAI,
                             request_model=request_model,
                             server_address=server_address,
                             server_port=server_port,

openlit/instrumentation/vllm/vllm.py CHANGED Viewed

@@ -13,7 +13,7 @@ from openlit.__helpers import (
     create_metrics_attributes,
     set_server_address_and_port
 )
-from openlit.semcov import SemanticConvetion
+from openlit.semcov import SemanticConvention
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
@@ -55,7 +55,7 @@ def generate(version, environment, application_name,
         server_address, server_port = set_server_address_and_port(instance, "api.cohere.com", 443)
         request_model = instance.llm_engine.model_config.model or "facebook/opt-125m"
-        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
         # pylint: disable=line-too-long
         with tracer.start_as_current_span(span_name, kind= SpanKind.CLIENT) as span:
@@ -66,19 +66,19 @@ def generate(version, environment, application_name,
             try:
                 # Set base span attribues
                 span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-                span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                    SemanticConvetion.GEN_AI_SYSTEM_VLLM)
-                span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                    SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-                span.set_attribute(SemanticConvetion.SERVER_PORT,
+                span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                    SemanticConvention.GEN_AI_SYSTEM_VLLM)
+                span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                    SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+                span.set_attribute(SemanticConvention.SERVER_PORT,
                                     server_port)
-                span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+                span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                     request_model)
-                span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                     request_model)
-                span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                     server_address)
-                span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                     "text")
                 # Set base span attribues (Extras)
@@ -86,11 +86,11 @@ def generate(version, environment, application_name,
                                      environment)
                 span.set_attribute(SERVICE_NAME,
                                     application_name)
-                span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+                span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                                     False)
-                span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+                span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                                     end_time - start_time)
-                span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                     version)
                 input_tokens = 0
@@ -102,34 +102,34 @@ def generate(version, environment, application_name,
                     completion_attributes = {}
                     for i, output in enumerate(response):
-                        prompt_attributes[f"{SemanticConvetion.GEN_AI_CONTENT_PROMPT}.{i}"] = output.prompt
-                        completion_attributes[f"{SemanticConvetion.GEN_AI_CONTENT_COMPLETION}.{i}"] = output.outputs[0].text
+                        prompt_attributes[f"{SemanticConvention.GEN_AI_CONTENT_PROMPT}.{i}"] = output.prompt
+                        completion_attributes[f"{SemanticConvention.GEN_AI_CONTENT_COMPLETION}.{i}"] = output.outputs[0].text
                         input_tokens += general_tokens(output.prompt)
                         output_tokens += general_tokens(output.outputs[0].text)
                     # Add a single event for all prompts
                     span.add_event(
-                        name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                        name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                         attributes=prompt_attributes,
                     )
                     # Add a single event for all completions
                     span.add_event(
-                        name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                        name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                         attributes=completion_attributes,
                     )
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                     input_tokens)
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+                span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                                     output_tokens)
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+                span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                     input_tokens + output_tokens)
                 # Calculate cost of the operation
                 cost = get_chat_model_cost(request_model, pricing_info,
                                             input_tokens, output_tokens)
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                     cost)
                 span.set_status(Status(StatusCode.OK))
@@ -138,8 +138,8 @@ def generate(version, environment, application_name,
                     attributes = create_metrics_attributes(
                         service_name=application_name,
                         deployment_environment=environment,
-                        operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-                        system=SemanticConvetion.GEN_AI_SYSTEM_VLLM,
+                        operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+                        system=SemanticConvention.GEN_AI_SYSTEM_VLLM,
                         request_model=request_model,
                         server_address=server_address,
                         server_port=server_port,

openlit 1.33.19__py3-none-any.whl → 1.33.20__py3-none-any.whl

openlit 1.33.19__py3-none-any.whl → 1.33.20__py3-none-any.whl