PyPI - openlit - Versions diffs - 1.33.19__py3-none-any.whl → 1.33.21__py3-none-any.whl - Mend

openlit 1.33.19-py3-none-any.whl → 1.33.21-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (82)

openlit/__helpers.py +64 -7
openlit/__init__.py +3 -3
openlit/evals/utils.py +7 -7
openlit/guard/utils.py +7 -7
openlit/instrumentation/ag2/ag2.py +24 -24
openlit/instrumentation/ai21/ai21.py +3 -3
openlit/instrumentation/ai21/async_ai21.py +3 -3
openlit/instrumentation/ai21/utils.py +59 -59
openlit/instrumentation/anthropic/anthropic.py +2 -2
openlit/instrumentation/anthropic/async_anthropic.py +2 -2
openlit/instrumentation/anthropic/utils.py +34 -34
openlit/instrumentation/assemblyai/assemblyai.py +24 -24
openlit/instrumentation/astra/astra.py +3 -3
openlit/instrumentation/astra/async_astra.py +3 -3
openlit/instrumentation/astra/utils.py +39 -39
openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +2 -2
openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +2 -2
openlit/instrumentation/azure_ai_inference/utils.py +36 -36
openlit/instrumentation/bedrock/bedrock.py +2 -2
openlit/instrumentation/bedrock/utils.py +35 -35
openlit/instrumentation/chroma/chroma.py +57 -57
openlit/instrumentation/cohere/async_cohere.py +88 -88
openlit/instrumentation/cohere/cohere.py +88 -88
openlit/instrumentation/controlflow/controlflow.py +15 -15
openlit/instrumentation/crawl4ai/async_crawl4ai.py +14 -14
openlit/instrumentation/crawl4ai/crawl4ai.py +14 -14
openlit/instrumentation/crewai/crewai.py +22 -22
openlit/instrumentation/dynamiq/dynamiq.py +19 -19
openlit/instrumentation/elevenlabs/async_elevenlabs.py +24 -25
openlit/instrumentation/elevenlabs/elevenlabs.py +23 -25
openlit/instrumentation/embedchain/embedchain.py +15 -15
openlit/instrumentation/firecrawl/firecrawl.py +10 -10
openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +33 -33
openlit/instrumentation/google_ai_studio/google_ai_studio.py +33 -33
openlit/instrumentation/gpt4all/gpt4all.py +78 -78
openlit/instrumentation/gpu/__init__.py +8 -8
openlit/instrumentation/groq/async_groq.py +74 -74
openlit/instrumentation/groq/groq.py +74 -74
openlit/instrumentation/haystack/haystack.py +6 -6
openlit/instrumentation/julep/async_julep.py +14 -14
openlit/instrumentation/julep/julep.py +14 -14
openlit/instrumentation/langchain/async_langchain.py +39 -39
openlit/instrumentation/langchain/langchain.py +39 -39
openlit/instrumentation/letta/letta.py +26 -26
openlit/instrumentation/litellm/async_litellm.py +94 -94
openlit/instrumentation/litellm/litellm.py +94 -94
openlit/instrumentation/llamaindex/llamaindex.py +7 -7
openlit/instrumentation/mem0/mem0.py +13 -13
openlit/instrumentation/milvus/milvus.py +47 -47
openlit/instrumentation/mistral/async_mistral.py +88 -88
openlit/instrumentation/mistral/mistral.py +88 -88
openlit/instrumentation/multion/async_multion.py +21 -21
openlit/instrumentation/multion/multion.py +21 -21
openlit/instrumentation/ollama/__init__.py +47 -34
openlit/instrumentation/ollama/async_ollama.py +7 -5
openlit/instrumentation/ollama/ollama.py +7 -5
openlit/instrumentation/ollama/utils.py +58 -54
openlit/instrumentation/openai/async_openai.py +225 -225
openlit/instrumentation/openai/openai.py +225 -225
openlit/instrumentation/openai_agents/openai_agents.py +11 -11
openlit/instrumentation/phidata/phidata.py +15 -15
openlit/instrumentation/pinecone/pinecone.py +43 -43
openlit/instrumentation/premai/premai.py +86 -86
openlit/instrumentation/qdrant/async_qdrant.py +95 -95
openlit/instrumentation/qdrant/qdrant.py +99 -99
openlit/instrumentation/reka/async_reka.py +33 -33
openlit/instrumentation/reka/reka.py +33 -33
openlit/instrumentation/together/async_together.py +90 -90
openlit/instrumentation/together/together.py +90 -90
openlit/instrumentation/transformers/__init__.py +11 -7
openlit/instrumentation/transformers/transformers.py +32 -168
openlit/instrumentation/transformers/utils.py +183 -0
openlit/instrumentation/vertexai/async_vertexai.py +64 -64
openlit/instrumentation/vertexai/vertexai.py +64 -64
openlit/instrumentation/vllm/vllm.py +24 -24
openlit/otel/metrics.py +11 -11
openlit/semcov/__init__.py +3 -3
{openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/METADATA +8 -8
openlit-1.33.21.dist-info/RECORD +132 -0
{openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/WHEEL +1 -1
openlit-1.33.19.dist-info/RECORD +0 -131
{openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/LICENSE +0 -0

openlit/instrumentation/google_ai_studio/google_ai_studio.py CHANGED Viewed

@@ -13,7 +13,7 @@ from openlit.__helpers import (
     create_metrics_attributes,
     set_server_address_and_port
 )
-from openlit.semcov import SemanticConvetion
+from openlit.semcov import SemanticConvention
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
@@ -56,7 +56,7 @@ def generate(version, environment, application_name,
         server_address, server_port = set_server_address_and_port(instance, "generativelanguage.googleapis.com", 443)
         request_model = kwargs.get("model", "gemini-2.0-flash")
-        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
         with tracer.start_as_current_span(span_name, kind=SpanKind.CLIENT) as span:
             start_time = time.time()
@@ -110,26 +110,26 @@ def generate(version, environment, application_name,
                 # Set base span attribues (OTel Semconv)
                 span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-                span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                    SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-                span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                    SemanticConvetion.GEN_AI_SYSTEM_GEMINI)
-                span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+                span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                    SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+                span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                    SemanticConvention.GEN_AI_SYSTEM_GEMINI)
+                span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                     request_model)
-                span.set_attribute(SemanticConvetion.SERVER_PORT,
+                span.set_attribute(SemanticConvention.SERVER_PORT,
                                     server_port)
                 inference_config = kwargs.get('config', {})
                 # List of attributes and their config keys
                 attributes = [
-                    (SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
-                    (SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS, 'max_tokens'),
-                    (SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
-                    (SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
-                    (SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
-                    (SemanticConvetion.GEN_AI_REQUEST_TOP_P, 'top_p'),
-                    (SemanticConvetion.GEN_AI_REQUEST_TOP_K, 'top_k'),
+                    (SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY, 'frequency_penalty'),
+                    (SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS, 'max_tokens'),
+                    (SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY, 'presence_penalty'),
+                    (SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES, 'stop_sequences'),
+                    (SemanticConvention.GEN_AI_REQUEST_TEMPERATURE, 'temperature'),
+                    (SemanticConvention.GEN_AI_REQUEST_TOP_P, 'top_p'),
+                    (SemanticConvention.GEN_AI_REQUEST_TOP_K, 'top_k'),
                 ]
                 # Set each attribute if the corresponding value exists and is not None
@@ -139,15 +139,15 @@ def generate(version, environment, application_name,
                     if value is not None:
                         span.set_attribute(attribute, value)
-                span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                     response_dict.get('model_version'))
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                     input_tokens)
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+                span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                                     output_tokens)
-                span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                     server_address)
-                span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_FINISH_REASON,
+                span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON,
                                     [str(response_dict.get('candidates')[0].get('finish_reason'))])
                 # Set base span attribues (Extras)
@@ -155,35 +155,35 @@ def generate(version, environment, application_name,
                                     environment)
                 span.set_attribute(SERVICE_NAME,
                                     application_name)
-                span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+                span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                                     False)
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+                span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                     input_tokens + output_tokens)
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                     cost)
-                span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+                span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                                     end_time - start_time)
-                span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                     version)
                 if capture_message_content:
                     span.add_event(
-                        name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                        name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                         attributes={
-                            SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                            SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
                         },
                     )
                     span.add_event(
-                        name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                        name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                         attributes={
-                            SemanticConvetion.GEN_AI_CONTENT_COMPLETION: response.text,
+                            SemanticConvention.GEN_AI_CONTENT_COMPLETION: response.text,
                         },
                     )
                     if isinstance(response_dict.get('text'), str):
-                        span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                        span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                         "text")
                     elif response_dict.get('text') is not None:
-                        span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                        span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                         "json")
                 span.set_status(Status(StatusCode.OK))
@@ -192,8 +192,8 @@ def generate(version, environment, application_name,
                     attributes = create_metrics_attributes(
                         service_name=application_name,
                         deployment_environment=environment,
-                        operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-                        system=SemanticConvetion.GEN_AI_SYSTEM_GEMINI,
+                        operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+                        system=SemanticConvention.GEN_AI_SYSTEM_GEMINI,
                         request_model=request_model,
                         server_address=server_address,
                         server_port=server_port,

openlit/instrumentation/gpt4all/gpt4all.py CHANGED Viewed

@@ -14,7 +14,7 @@ from openlit.__helpers import (
     calculate_tbt,
     calculate_ttft
 )
-from openlit.semcov import SemanticConvetion
+from openlit.semcov import SemanticConvention
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
@@ -116,39 +116,39 @@ def generate(version, environment, application_name,
                     # Set Span attributes (OTel Semconv)
                     self._span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                        SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                        SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                        SemanticConvention.GEN_AI_SYSTEM_GPT4ALL)
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                         self._request_model)
-                    self._span.set_attribute(SemanticConvetion.SERVER_PORT,
+                    self._span.set_attribute(SemanticConvention.SERVER_PORT,
                                         self._server_port)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY,
                                         self._kwargs.get("repeat_penalty", 1.18))
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS,
                                         self._kwargs.get("max_tokens", 200))
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY,
                                         self._kwargs.get("presence_penalty", 0.0))
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TEMPERATURE,
                                         self._kwargs.get("temp", 0.7))
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TOP_P,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_P,
                                         self._kwargs.get("top_p", 0.4))
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TOP_K,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_K,
                                         self._kwargs.get("top_k", 40))
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                         self._request_model)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                         input_tokens)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                                         output_tokens)
-                    self._span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                    self._span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                         self._server_address)
                     if isinstance(self._llmresponse, str):
-                        self._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                        self._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                         "text")
                     else:
-                        self._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                        self._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                         "json")
                     # Set Span attributes (Extra)
@@ -156,29 +156,29 @@ def generate(version, environment, application_name,
                                         environment)
                     self._span.set_attribute(SERVICE_NAME,
                                         application_name)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                                         True)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                         input_tokens + output_tokens)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TBT,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TBT,
                                         self._tbt)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                                         self._ttft)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                         version)
-                    self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                    self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                         0)
                     if capture_message_content:
                         self._span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                                SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
                             },
                         )
                         self._span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_COMPLETION: self._llmresponse,
+                                SemanticConvention.GEN_AI_CONTENT_COMPLETION: self._llmresponse,
                             },
                         )
@@ -188,8 +188,8 @@ def generate(version, environment, application_name,
                         attributes = create_metrics_attributes(
                             service_name=application_name,
                             deployment_environment=environment,
-                            operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-                            system=SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL,
+                            operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+                            system=SemanticConvention.GEN_AI_SYSTEM_GPT4ALL,
                             request_model=self._request_model,
                             server_address=self._server_address,
                             server_port=self._server_port,
@@ -243,7 +243,7 @@ def generate(version, environment, application_name,
         server_address, server_port = set_server_address_and_port(instance, "localhost", 80)
         request_model = str(instance.model.model_path).rsplit('/', maxsplit=1)[-1] or "orca-mini-3b-gguf2-q4_0.gguf"
-        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
         # pylint: disable=no-else-return
         if streaming:
@@ -269,39 +269,39 @@ def generate(version, environment, application_name,
                     # Set Span attributes (OTel Semconv)
                     span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-                    span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                        SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-                    span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                        SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL)
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+                    span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                        SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+                    span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                        SemanticConvention.GEN_AI_SYSTEM_GPT4ALL)
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                         request_model)
-                    span.set_attribute(SemanticConvetion.SERVER_PORT,
+                    span.set_attribute(SemanticConvention.SERVER_PORT,
                                         server_port)
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY,
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY,
                                         kwargs.get("repeat_penalty", 1.18))
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS,
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS,
                                         kwargs.get("max_tokens", 200))
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY,
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY,
                                         kwargs.get("presence_penalty", 0.0))
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE,
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TEMPERATURE,
                                         kwargs.get("temp", 0.7))
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TOP_P,
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_P,
                                         kwargs.get("top_p", 0.4))
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TOP_K,
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_K,
                                         kwargs.get("top_k", 40))
-                    span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                    span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                         request_model)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                         input_tokens)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                                         output_tokens)
-                    span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                    span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                         server_address)
                     if isinstance(response, str):
-                        span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                        span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                         "text")
                     else:
-                        span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                        span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                         "json")
                     # Set Span attributes (Extra)
@@ -309,27 +309,27 @@ def generate(version, environment, application_name,
                                         environment)
                     span.set_attribute(SERVICE_NAME,
                                         application_name)
-                    span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+                    span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                                         False)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                         input_tokens + output_tokens)
-                    span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+                    span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                                         end_time - start_time)
-                    span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                    span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                         version)
-                    span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                    span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                         0)
                     if capture_message_content:
                         span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                                SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
                             },
                         )
                         span.add_event(
-                            name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                            name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                             attributes={
-                                SemanticConvetion.GEN_AI_CONTENT_COMPLETION: response,
+                                SemanticConvention.GEN_AI_CONTENT_COMPLETION: response,
                             },
                         )
@@ -339,8 +339,8 @@ def generate(version, environment, application_name,
                         attributes = create_metrics_attributes(
                             service_name=application_name,
                             deployment_environment=environment,
-                            operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-                            system=SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL,
+                            operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+                            system=SemanticConvention.GEN_AI_SYSTEM_GPT4ALL,
                             request_model=request_model,
                             server_address=server_address,
                             server_port=server_port,
@@ -412,7 +412,7 @@ def embed(version, environment, application_name,
         # pylint: disable=line-too-long
         request_model = str(instance.gpt4all.model.model_path).rsplit('/', maxsplit=1)[-1] or "all-MiniLM-L6-v2.gguf2.f16.gguf"
-        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_EMBEDDING} {request_model}"
+        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING} {request_model}"
         with tracer.start_as_current_span(span_name, kind= SpanKind.CLIENT) as span:
             start_time = time.time()
@@ -425,19 +425,19 @@ def embed(version, environment, application_name,
                 # Set Span attributes (OTel Semconv)
                 span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-                span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                    SemanticConvetion.GEN_AI_OPERATION_TYPE_EMBEDDING)
-                span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                    SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL)
-                span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+                span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                    SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING)
+                span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                    SemanticConvention.GEN_AI_SYSTEM_GPT4ALL)
+                span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                     request_model)
-                span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                     request_model)
-                span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                     server_address)
-                span.set_attribute(SemanticConvetion.SERVER_PORT,
+                span.set_attribute(SemanticConvention.SERVER_PORT,
                                     server_port)
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                     input_tokens)
                 # Set Span attributes (Extras)
@@ -445,18 +445,18 @@ def embed(version, environment, application_name,
                                     environment)
                 span.set_attribute(SERVICE_NAME,
                                     application_name)
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+                span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                     input_tokens)
-                span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                     version)
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                     0)
                 if capture_message_content:
                     span.add_event(
-                        name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                        name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                         attributes={
-                            SemanticConvetion.GEN_AI_CONTENT_PROMPT: str(kwargs.get("input", "")),
+                            SemanticConvention.GEN_AI_CONTENT_PROMPT: str(kwargs.get("input", "")),
                         },
                     )
@@ -466,8 +466,8 @@ def embed(version, environment, application_name,
                     attributes = create_metrics_attributes(
                         service_name=application_name,
                         deployment_environment=environment,
-                        operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_EMBEDDING,
-                        system=SemanticConvetion.GEN_AI_SYSTEM_GPT4ALL,
+                        operation=SemanticConvention.GEN_AI_OPERATION_TYPE_EMBEDDING,
+                        system=SemanticConvention.GEN_AI_SYSTEM_GPT4ALL,
                         request_model=request_model,
                         server_address=server_address,
                         server_port=server_port,

openlit/instrumentation/gpu/__init__.py CHANGED Viewed

@@ -7,7 +7,7 @@ from functools import partial
 from opentelemetry.instrumentation.instrumentor import BaseInstrumentor
 from opentelemetry.sdk.resources import SERVICE_NAME, TELEMETRY_SDK_NAME, DEPLOYMENT_ENVIRONMENT
 from opentelemetry.metrics import get_meter, CallbackOptions, Observation
-from openlit.semcov import SemanticConvetion
+from openlit.semcov import SemanticConvention
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
@@ -54,7 +54,7 @@ class GPUInstrumentor(BaseInstrumentor):
         for semantic_name, internal_name in metric_names:
             meter.create_observable_gauge(
-                name=getattr(SemanticConvetion, semantic_name),
+                name=getattr(SemanticConvention, semantic_name),
                 callbacks=[partial(self._collect_metric,
                                    environment, application_name, internal_name)],
                 description=f"GPU {internal_name.replace('_', ' ').title()}",
@@ -141,9 +141,9 @@ class GPUInstrumentor(BaseInstrumentor):
                     TELEMETRY_SDK_NAME: "openlit",
                     SERVICE_NAME: application_name,
                     DEPLOYMENT_ENVIRONMENT: environment,
-                    SemanticConvetion.GPU_INDEX: str(gpu_index),
-                    SemanticConvetion.GPU_UUID: safe_decode(pynvml.nvmlDeviceGetUUID(handle)),
-                    SemanticConvetion.GPU_NAME: safe_decode(pynvml.nvmlDeviceGetName(handle))
+                    SemanticConvention.GPU_INDEX: str(gpu_index),
+                    SemanticConvention.GPU_UUID: safe_decode(pynvml.nvmlDeviceGetUUID(handle)),
+                    SemanticConvention.GPU_NAME: safe_decode(pynvml.nvmlDeviceGetName(handle))
                 }
                 yield Observation(get_metric_value(handle, metric_name), attributes)
@@ -202,10 +202,10 @@ class GPUInstrumentor(BaseInstrumentor):
                     SERVICE_NAME: application_name,
                     DEPLOYMENT_ENVIRONMENT: environment,
                     # pylint: disable=line-too-long
-                    SemanticConvetion.GPU_INDEX: amdsmi.amdsmi_get_xgmi_info(device_handle)['index'],
+                    SemanticConvention.GPU_INDEX: amdsmi.amdsmi_get_xgmi_info(device_handle)['index'],
                     # pylint: disable=line-too-long
-                    SemanticConvetion.GPU_UUID: amdsmi.amdsmi_get_gpu_asic_info(device_handle)['market_name'],
-                    SemanticConvetion.GPU_NAME: amdsmi.amdsmi_get_device_name(device_handle)
+                    SemanticConvention.GPU_UUID: amdsmi.amdsmi_get_gpu_asic_info(device_handle)['market_name'],
+                    SemanticConvention.GPU_NAME: amdsmi.amdsmi_get_device_name(device_handle)
                 }
                 yield Observation(get_metric_value(device_handle, metric_name), attributes)

openlit 1.33.19__py3-none-any.whl → 1.33.21__py3-none-any.whl

openlit 1.33.19__py3-none-any.whl → 1.33.21__py3-none-any.whl