openlit 1.33.19__py3-none-any.whl → 1.33.21__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- openlit/__helpers.py +64 -7
- openlit/__init__.py +3 -3
- openlit/evals/utils.py +7 -7
- openlit/guard/utils.py +7 -7
- openlit/instrumentation/ag2/ag2.py +24 -24
- openlit/instrumentation/ai21/ai21.py +3 -3
- openlit/instrumentation/ai21/async_ai21.py +3 -3
- openlit/instrumentation/ai21/utils.py +59 -59
- openlit/instrumentation/anthropic/anthropic.py +2 -2
- openlit/instrumentation/anthropic/async_anthropic.py +2 -2
- openlit/instrumentation/anthropic/utils.py +34 -34
- openlit/instrumentation/assemblyai/assemblyai.py +24 -24
- openlit/instrumentation/astra/astra.py +3 -3
- openlit/instrumentation/astra/async_astra.py +3 -3
- openlit/instrumentation/astra/utils.py +39 -39
- openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +2 -2
- openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +2 -2
- openlit/instrumentation/azure_ai_inference/utils.py +36 -36
- openlit/instrumentation/bedrock/bedrock.py +2 -2
- openlit/instrumentation/bedrock/utils.py +35 -35
- openlit/instrumentation/chroma/chroma.py +57 -57
- openlit/instrumentation/cohere/async_cohere.py +88 -88
- openlit/instrumentation/cohere/cohere.py +88 -88
- openlit/instrumentation/controlflow/controlflow.py +15 -15
- openlit/instrumentation/crawl4ai/async_crawl4ai.py +14 -14
- openlit/instrumentation/crawl4ai/crawl4ai.py +14 -14
- openlit/instrumentation/crewai/crewai.py +22 -22
- openlit/instrumentation/dynamiq/dynamiq.py +19 -19
- openlit/instrumentation/elevenlabs/async_elevenlabs.py +24 -25
- openlit/instrumentation/elevenlabs/elevenlabs.py +23 -25
- openlit/instrumentation/embedchain/embedchain.py +15 -15
- openlit/instrumentation/firecrawl/firecrawl.py +10 -10
- openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +33 -33
- openlit/instrumentation/google_ai_studio/google_ai_studio.py +33 -33
- openlit/instrumentation/gpt4all/gpt4all.py +78 -78
- openlit/instrumentation/gpu/__init__.py +8 -8
- openlit/instrumentation/groq/async_groq.py +74 -74
- openlit/instrumentation/groq/groq.py +74 -74
- openlit/instrumentation/haystack/haystack.py +6 -6
- openlit/instrumentation/julep/async_julep.py +14 -14
- openlit/instrumentation/julep/julep.py +14 -14
- openlit/instrumentation/langchain/async_langchain.py +39 -39
- openlit/instrumentation/langchain/langchain.py +39 -39
- openlit/instrumentation/letta/letta.py +26 -26
- openlit/instrumentation/litellm/async_litellm.py +94 -94
- openlit/instrumentation/litellm/litellm.py +94 -94
- openlit/instrumentation/llamaindex/llamaindex.py +7 -7
- openlit/instrumentation/mem0/mem0.py +13 -13
- openlit/instrumentation/milvus/milvus.py +47 -47
- openlit/instrumentation/mistral/async_mistral.py +88 -88
- openlit/instrumentation/mistral/mistral.py +88 -88
- openlit/instrumentation/multion/async_multion.py +21 -21
- openlit/instrumentation/multion/multion.py +21 -21
- openlit/instrumentation/ollama/__init__.py +47 -34
- openlit/instrumentation/ollama/async_ollama.py +7 -5
- openlit/instrumentation/ollama/ollama.py +7 -5
- openlit/instrumentation/ollama/utils.py +58 -54
- openlit/instrumentation/openai/async_openai.py +225 -225
- openlit/instrumentation/openai/openai.py +225 -225
- openlit/instrumentation/openai_agents/openai_agents.py +11 -11
- openlit/instrumentation/phidata/phidata.py +15 -15
- openlit/instrumentation/pinecone/pinecone.py +43 -43
- openlit/instrumentation/premai/premai.py +86 -86
- openlit/instrumentation/qdrant/async_qdrant.py +95 -95
- openlit/instrumentation/qdrant/qdrant.py +99 -99
- openlit/instrumentation/reka/async_reka.py +33 -33
- openlit/instrumentation/reka/reka.py +33 -33
- openlit/instrumentation/together/async_together.py +90 -90
- openlit/instrumentation/together/together.py +90 -90
- openlit/instrumentation/transformers/__init__.py +11 -7
- openlit/instrumentation/transformers/transformers.py +32 -168
- openlit/instrumentation/transformers/utils.py +183 -0
- openlit/instrumentation/vertexai/async_vertexai.py +64 -64
- openlit/instrumentation/vertexai/vertexai.py +64 -64
- openlit/instrumentation/vllm/vllm.py +24 -24
- openlit/otel/metrics.py +11 -11
- openlit/semcov/__init__.py +3 -3
- {openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/METADATA +8 -8
- openlit-1.33.21.dist-info/RECORD +132 -0
- {openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/WHEEL +1 -1
- openlit-1.33.19.dist-info/RECORD +0 -131
- {openlit-1.33.19.dist-info → openlit-1.33.21.dist-info}/LICENSE +0 -0
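
Nearly every module above changes by symmetric +N/-N line counts because this release renames the misspelled semantic-convention class SemanticConvetion to SemanticConvention across the instrumentation packages, as the hunks below show. A minimal before/after sketch of the repeated pattern; the span object and the attribute pair are chosen for illustration:

    # 1.33.19: misspelled class name
    from openlit.semcov import SemanticConvetion
    span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
                       SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)

    # 1.33.21: corrected spelling; attribute keys and values are unchanged
    from openlit.semcov import SemanticConvention
    span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
                       SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)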
@@ -16,7 +16,7 @@ from openlit.__helpers import (
     create_metrics_attributes,
     set_server_address_and_port
 )
-from openlit.semcov import SemanticConvetion
+from openlit.semcov import SemanticConvention
 
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
@@ -157,46 +157,46 @@ def completion(version, environment, application_name,
 
         # Set Span attributes (OTel Semconv)
         self._span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-        self._span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                 SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                 SemanticConvetion.GEN_AI_SYSTEM_TOGETHER)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+        self._span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                 SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+        self._span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                 SemanticConvention.GEN_AI_SYSTEM_TOGETHER)
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                  request_model)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_SEED,
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_SEED,
                                  self._kwargs.get("seed", ""))
-        self._span.set_attribute(SemanticConvetion.SERVER_PORT,
+        self._span.set_attribute(SemanticConvention.SERVER_PORT,
                                  self._server_port)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY,
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY,
                                  self._kwargs.get("frequency_penalty", 0.0))
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS,
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS,
                                  self._kwargs.get("max_tokens", -1))
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY,
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY,
                                  self._kwargs.get("presence_penalty", 0.0))
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES,
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES,
                                  self._kwargs.get("stop", []))
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE,
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TEMPERATURE,
                                  self._kwargs.get("temperature", 1.0))
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TOP_P,
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_P,
                                  self._kwargs.get("top_p", 1.0))
-        self._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_FINISH_REASON,
+        self._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON,
                                  [self._finish_reason])
-        self._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_ID,
+        self._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_ID,
                                  self._response_id)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+        self._span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                  self._response_model)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+        self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                                  self._input_tokens)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+        self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                                  self._output_tokens)
-        self._span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+        self._span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                  self._server_address)
 
         if isinstance(self._llmresponse, str):
-            self._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+            self._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                      "text")
         else:
-            self._span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+            self._span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                      "json")
 
         # Set Span attributes (Extra)
@@ -204,31 +204,31 @@ def completion(version, environment, application_name,
                                  environment)
         self._span.set_attribute(SERVICE_NAME,
                                  application_name)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_USER,
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_USER,
                                  self._kwargs.get("user", ""))
-        self._span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+        self._span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                                  True)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+        self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                                  self._input_tokens + self._output_tokens)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+        self._span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                                  cost)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TBT,
+        self._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TBT,
                                  self._tbt)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+        self._span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                                  self._ttft)
-        self._span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+        self._span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                  version)
         if capture_message_content:
             self._span.add_event(
-                name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                 attributes={
-                    SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                    SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
                 },
             )
             self._span.add_event(
-                name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                 attributes={
-                    SemanticConvetion.GEN_AI_CONTENT_COMPLETION: self._llmresponse,
+                    SemanticConvention.GEN_AI_CONTENT_COMPLETION: self._llmresponse,
                 },
             )
         self._span.set_status(Status(StatusCode.OK))
@@ -237,8 +237,8 @@ def completion(version, environment, application_name,
         attributes = create_metrics_attributes(
             service_name=application_name,
             deployment_environment=environment,
-            operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-            system=SemanticConvetion.GEN_AI_SYSTEM_TOGETHER,
+            operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+            system=SemanticConvention.GEN_AI_SYSTEM_TOGETHER,
             request_model=request_model,
             server_address=self._server_address,
             server_port=self._server_port,
@@ -290,7 +290,7 @@ def completion(version, environment, application_name,
         server_address, server_port = set_server_address_and_port(instance, "api.together.xyz", 443)
         request_model = kwargs.get("model", "gpt-4o")
 
-        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
 
         # pylint: disable=no-else-return
         if streaming:
@@ -338,37 +338,37 @@ def completion(version, environment, application_name,
 
            # Set base span attribues (OTel Semconv)
            span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-           span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                              SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-           span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                              SemanticConvetion.GEN_AI_SYSTEM_TOGETHER)
-           span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+           span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                              SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT)
+           span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                              SemanticConvention.GEN_AI_SYSTEM_TOGETHER)
+           span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                               request_model)
-           span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_SEED,
+           span.set_attribute(SemanticConvention.GEN_AI_REQUEST_SEED,
                               kwargs.get("seed", ""))
-           span.set_attribute(SemanticConvetion.SERVER_PORT,
+           span.set_attribute(SemanticConvention.SERVER_PORT,
                               server_port)
-           span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_FREQUENCY_PENALTY,
+           span.set_attribute(SemanticConvention.GEN_AI_REQUEST_FREQUENCY_PENALTY,
                               kwargs.get("frequency_penalty", 0.0))
-           span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS,
+           span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MAX_TOKENS,
                               kwargs.get("max_tokens", -1))
-           span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_PRESENCE_PENALTY,
+           span.set_attribute(SemanticConvention.GEN_AI_REQUEST_PRESENCE_PENALTY,
                               kwargs.get("presence_penalty", 0.0))
-           span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_STOP_SEQUENCES,
+           span.set_attribute(SemanticConvention.GEN_AI_REQUEST_STOP_SEQUENCES,
                               kwargs.get("stop", []))
-           span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE,
+           span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TEMPERATURE,
                               kwargs.get("temperature", 1.0))
-           span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TOP_P,
+           span.set_attribute(SemanticConvention.GEN_AI_REQUEST_TOP_P,
                               kwargs.get("top_p", 1.0))
-           span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_ID,
+           span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_ID,
                               response_dict.get("id"))
-           span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+           span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                               response_dict.get('model'))
-           span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+           span.set_attribute(SemanticConvention.GEN_AI_USAGE_INPUT_TOKENS,
                               input_tokens)
-           span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+           span.set_attribute(SemanticConvention.GEN_AI_USAGE_OUTPUT_TOKENS,
                               output_tokens)
-           span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+           span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                               server_address)
 
            # Set base span attribues (Extras)
@@ -376,46 +376,46 @@ def completion(version, environment, application_name,
                               environment)
            span.set_attribute(SERVICE_NAME,
                               application_name)
-           span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_USER,
+           span.set_attribute(SemanticConvention.GEN_AI_REQUEST_USER,
                               kwargs.get("user", ""))
-           span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+           span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IS_STREAM,
                               False)
-           span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
+           span.set_attribute(SemanticConvention.GEN_AI_USAGE_TOTAL_TOKENS,
                               input_tokens + output_tokens)
-           span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+           span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                               cost)
-           span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+           span.set_attribute(SemanticConvention.GEN_AI_SERVER_TTFT,
                               end_time - start_time)
-           span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+           span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                               version)
            if capture_message_content:
                span.add_event(
-                   name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                   name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                    attributes={
-                       SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
+                       SemanticConvention.GEN_AI_CONTENT_PROMPT: prompt,
                    },
                )
 
            for i in range(kwargs.get('n',1)):
-               span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_FINISH_REASON,
+               span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_FINISH_REASON,
                                   [str(response_dict.get('choices')[i].get('finish_reason'))])
                if capture_message_content:
                    span.add_event(
-                       name=SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT,
+                       name=SemanticConvention.GEN_AI_CONTENT_COMPLETION_EVENT,
                        attributes={
                            # pylint: disable=line-too-long
-                           SemanticConvetion.GEN_AI_CONTENT_COMPLETION: str(response_dict.get('choices')[i].get('message').get('content')),
+                           SemanticConvention.GEN_AI_CONTENT_COMPLETION: str(response_dict.get('choices')[i].get('message').get('content')),
                        },
                    )
                if kwargs.get('tools'):
-                   span.set_attribute(SemanticConvetion.GEN_AI_TOOL_CALLS,
+                   span.set_attribute(SemanticConvention.GEN_AI_TOOL_CALLS,
                                       str(response_dict.get('choices')[i].get('message').get('tool_calls')))
 
                if isinstance(response_dict.get('choices')[i].get('message').get('content'), str):
-                   span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                   span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                       "text")
                elif response_dict.get('choices')[i].get('message').get('content') is not None:
-                   span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+                   span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                       "json")
 
            span.set_status(Status(StatusCode.OK))
@@ -424,8 +424,8 @@ def completion(version, environment, application_name,
            attributes = create_metrics_attributes(
                service_name=application_name,
                deployment_environment=environment,
-               operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-               system=SemanticConvetion.GEN_AI_SYSTEM_TOGETHER,
+               operation=SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT,
+               system=SemanticConvention.GEN_AI_SYSTEM_TOGETHER,
                request_model=request_model,
                server_address=server_address,
                server_port=server_port,
@@ -495,7 +495,7 @@ def image_generate(version, environment, application_name,
         server_address, server_port = set_server_address_and_port(instance, "api.together.xyz", 443)
         request_model = kwargs.get("model", "dall-e-2")
 
-        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_IMAGE} {request_model}"
+        span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_IMAGE} {request_model}"
 
         with tracer.start_as_current_span(span_name, kind= SpanKind.CLIENT) as span:
             start_time = time.time()
@@ -521,21 +521,21 @@ def image_generate(version, environment, application_name,
            for items in response.data:
                # Set Span attributes (OTel Semconv)
                span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-               span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                  SemanticConvetion.GEN_AI_OPERATION_TYPE_IMAGE)
-               span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                  SemanticConvetion.GEN_AI_SYSTEM_TOGETHER)
-               span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
+               span.set_attribute(SemanticConvention.GEN_AI_OPERATION,
+                                  SemanticConvention.GEN_AI_OPERATION_TYPE_IMAGE)
+               span.set_attribute(SemanticConvention.GEN_AI_SYSTEM,
+                                  SemanticConvention.GEN_AI_SYSTEM_TOGETHER)
+               span.set_attribute(SemanticConvention.GEN_AI_REQUEST_MODEL,
                                   request_model)
-               span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+               span.set_attribute(SemanticConvention.SERVER_ADDRESS,
                                   server_address)
-               span.set_attribute(SemanticConvetion.SERVER_PORT,
+               span.set_attribute(SemanticConvention.SERVER_PORT,
                                   server_port)
-               span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_ID,
+               span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_ID,
                                   response.id)
-               span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+               span.set_attribute(SemanticConvention.GEN_AI_RESPONSE_MODEL,
                                   response.model)
-               span.set_attribute(SemanticConvetion.GEN_AI_OUTPUT_TYPE,
+               span.set_attribute(SemanticConvention.GEN_AI_OUTPUT_TYPE,
                                   "image")
 
                # Set Span attributes (Extras)
@@ -543,29 +543,29 @@ def image_generate(version, environment, application_name,
                                  environment)
                span.set_attribute(SERVICE_NAME,
                                   application_name)
-               span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IMAGE_SIZE,
+               span.set_attribute(SemanticConvention.GEN_AI_REQUEST_IMAGE_SIZE,
                                   image_size)
-               span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+               span.set_attribute(SemanticConvention.GEN_AI_SDK_VERSION,
                                   version)
 
                if capture_message_content:
                    span.add_event(
-                       name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
+                       name=SemanticConvention.GEN_AI_CONTENT_PROMPT_EVENT,
                        attributes={
-                           SemanticConvetion.GEN_AI_CONTENT_PROMPT: kwargs.get("prompt", ""),
+                           SemanticConvention.GEN_AI_CONTENT_PROMPT: kwargs.get("prompt", ""),
                        },
                    )
-                   attribute_name = f"{SemanticConvetion.GEN_AI_RESPONSE_IMAGE}.{images_count}"
+                   attribute_name = f"{SemanticConvention.GEN_AI_RESPONSE_IMAGE}.{images_count}"
                    span.add_event(
                        name=attribute_name,
                        attributes={
-                           SemanticConvetion.GEN_AI_CONTENT_COMPLETION: getattr(items, image),
+                           SemanticConvention.GEN_AI_CONTENT_COMPLETION: getattr(items, image),
                        },
                    )
 
                images_count+=1
 
-           span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+           span.set_attribute(SemanticConvention.GEN_AI_USAGE_COST,
                               len(response.data) * cost)
            span.set_status(Status(StatusCode.OK))
 
@@ -573,8 +573,8 @@ def image_generate(version, environment, application_name,
            attributes = create_metrics_attributes(
                service_name=application_name,
                deployment_environment=environment,
-               operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_IMAGE,
-               system=SemanticConvetion.GEN_AI_SYSTEM_TOGETHER,
+               operation=SemanticConvention.GEN_AI_OPERATION_TYPE_IMAGE,
+               system=SemanticConvention.GEN_AI_SYSTEM_TOGETHER,
                request_model=request_model,
                server_address=server_address,
                server_port=server_port,
@@ -1,16 +1,20 @@
-
-
+"""
+Initializer of Auto Instrumentation of HuggingFace Transformer Functions
+"""
+
 from typing import Collection
 import importlib.metadata
 from opentelemetry.instrumentation.instrumentor import BaseInstrumentor
 from wrapt import wrap_function_wrapper
 
-from openlit.instrumentation.transformers.transformers import
+from openlit.instrumentation.transformers.transformers import pipeline_wrapper
 
-_instruments = ("transformers >= 4.
+_instruments = ("transformers >= 4.48.0",)
 
 class TransformersInstrumentor(BaseInstrumentor):
-    """
+    """
+    An instrumentor for HuggingFace Transformer library.
+    """
 
     def instrumentation_dependencies(self) -> Collection[str]:
         return _instruments
@@ -28,10 +32,10 @@ class TransformersInstrumentor(BaseInstrumentor):
        wrap_function_wrapper(
            "transformers",
            "TextGenerationPipeline.__call__",
-
+           pipeline_wrapper(version, environment, application_name,
                            tracer, pricing_info, capture_message_content, metrics, disable_metrics),
        )
 
-   @staticmethod
    def _uninstrument(self, **kwargs):
+       # Proper uninstrumentation logic to revert patched methods
        pass
@@ -1,197 +1,61 @@
 """
-Module for monitoring
+Module for monitoring HF Transformers API calls.
 """
 
 import logging
 import time
-from opentelemetry.trace import SpanKind
-from opentelemetry.sdk.resources import SERVICE_NAME, TELEMETRY_SDK_NAME, DEPLOYMENT_ENVIRONMENT
+from opentelemetry.trace import SpanKind
 from openlit.__helpers import (
-    get_chat_model_cost,
-    handle_exception,
-    general_tokens,
-    create_metrics_attributes,
     set_server_address_and_port
 )
-
+
+from openlit.instrumentation.transformers.utils import (
+    process_chat_response,
+)
+from openlit.semcov import SemanticConvention
 
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
 
-def
-
+def pipeline_wrapper(version, environment, application_name,
+                     tracer, pricing_info, capture_message_content, metrics, disable_metrics):
     """
-
-
-    This function wraps any given function to measure its execution time,
-    log its operation, and trace its execution using OpenTelemetry.
-
-    Parameters:
-    - version (str): The version of the Langchain application.
-    - environment (str): The deployment environment (e.g., 'production', 'development').
-    - application_name (str): Name of the Langchain application.
-    - tracer (opentelemetry.trace.Tracer): The tracer object used for OpenTelemetry tracing.
-    - pricing_info (dict): Information about the pricing for internal metrics (currently not used).
-    - capture_message_content (bool): Flag indicating whether to trace the content of the response.
-
-    Returns:
-    - function: A higher-order function that takes a function 'wrapped' and returns
-      a new function that wraps 'wrapped' with additional tracing and logging.
+    Generates a telemetry wrapper for GenAI function call
     """
 
     def wrapper(wrapped, instance, args, kwargs):
        """
-
-       time, and records trace data using OpenTelemetry.
-
-       Parameters:
-       - wrapped (Callable): The original function that this wrapper will execute.
-       - instance (object): The instance to which the wrapped function belongs. This
-                            is used for instance methods. For static and classmethods,
-                            this may be None.
-       - args (tuple): Positional arguments passed to the wrapped function.
-       - kwargs (dict): Keyword arguments passed to the wrapped function.
-
-       Returns:
-       - The result of the wrapped function call.
-
-       The wrapper initiates a span with the provided tracer, sets various attributes
-       on the span based on the function's execution and response, and ensures
-       errors are handled and logged appropriately.
+       Wraps the GenAI function call.
        """
 
        server_address, server_port = set_server_address_and_port(instance, "127.0.0.1", 80)
        request_model = instance.model.config.name_or_path
 
-       span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+       span_name = f"{SemanticConvention.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
 
        with tracer.start_as_current_span(span_name, kind= SpanKind.CLIENT) as span:
            start_time = time.time()
            response = wrapped(*args, **kwargs)
-           end_time = time.time()
-
-           # pylint: disable=protected-access
-           forward_params = instance._forward_params
-
-           try:
-               if args and len(args) > 0:
-                   prompt = args[0]
-               else:
-                   prompt = kwargs.get("args", "")
-
-               input_tokens = general_tokens(prompt[0])
-
-               span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-               span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
-                                  SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
-               span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
-                                  SemanticConvetion.GEN_AI_SYSTEM_HUGGING_FACE)
-               span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
-                                  request_model)
-               span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE,
-                                  forward_params.get("temperature", "null"))
-               span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TOP_P,
-                                  forward_params.get("top_p", "null"))
-               span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS,
-                                  forward_params.get("max_length", -1))
-               span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
-                                  input_tokens)
-               span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
-                                  server_address)
-               span.set_attribute(SemanticConvetion.SERVER_PORT,
-                                  server_port)
-               span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
-                                  request_model)
-
-               span.set_attribute(DEPLOYMENT_ENVIRONMENT,
-                                  environment)
-               span.set_attribute(SERVICE_NAME,
-                                  application_name)
-               span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
-                                  False)
-               span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
-                                  end_time - start_time)
-               span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
-                                  version)
-               if capture_message_content:
-                   span.add_event(
-                       name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
-                       attributes={
-                           SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
-                       },
-                   )
-
-               i = 0
-               output_tokens = 0
-               for completion in response:
-                   if len(response) > 1:
-                       attribute_name = f"gen_ai.content.completion.{i}"
-                   else:
-                       attribute_name = SemanticConvetion.GEN_AI_CONTENT_COMPLETION_EVENT
-                   if capture_message_content:
-                       # pylint: disable=bare-except
-                       try:
-                           llm_response = completion.get('generated_text', '')
-                       except:
-                           llm_response = completion[i].get('generated_text', '')
-
-                       span.add_event(
-                           name=attribute_name,
-                           attributes={
-                               SemanticConvetion.GEN_AI_CONTENT_COMPLETION: llm_response,
-                           },
-                       )
-                       output_tokens += general_tokens(llm_response)
-
-                   i=i+1
-               span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
-                                  output_tokens)
-               span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
-                                  input_tokens + output_tokens)
-
-               # Calculate cost of the operation
-               cost = get_chat_model_cost(request_model,
-                                          pricing_info, input_tokens,
-                                          output_tokens)
-               span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
-                                  cost)
-
-               span.set_status(Status(StatusCode.OK))
-
-               if disable_metrics is False:
-                   attributes = create_metrics_attributes(
-                       service_name=application_name,
-                       deployment_environment=environment,
-                       operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
-                       system=SemanticConvetion.GEN_AI_SYSTEM_HUGGING_FACE,
-                       request_model=request_model,
-                       server_address=server_address,
-                       server_port=server_port,
-                       response_model=request_model,
-                   )
-
-                   metrics["genai_client_usage_tokens"].record(
-                       input_tokens + output_tokens, attributes
-                   )
-                   metrics["genai_client_operation_duration"].record(
-                       end_time - start_time, attributes
-                   )
-                   metrics["genai_server_ttft"].record(
-                       end_time - start_time, attributes
-                   )
-                   metrics["genai_requests"].add(1, attributes)
-                   metrics["genai_completion_tokens"].add(output_tokens, attributes)
-                   metrics["genai_prompt_tokens"].add(input_tokens, attributes)
-                   metrics["genai_cost"].record(cost, attributes)
-
-               # Return original response
-               return response
-
-           except Exception as e:
-               handle_exception(span, e)
-               logger.error("Error in trace creation: %s", e)
 
-
-
+           response = process_chat_response(
+               instance = instance,
+               response=response,
+               request_model=request_model,
+               pricing_info=pricing_info,
+               server_port=server_port,
+               server_address=server_address,
+               environment=environment,
+               application_name=application_name,
+               metrics=metrics,
+               start_time=start_time,
+               span=span,
+               args=args,
+               kwargs=kwargs,
+               capture_message_content=capture_message_content,
+               disable_metrics=disable_metrics,
+               version=version,
+           )
+
+           return response
 
     return wrapper