PyPI - openlit - Versions diffs - 1.33.8__py3-none-any.whl → 1.33.10__py3-none-any.whl - Mend

openlit 1.33.8__py3-none-any.whl → 1.33.10__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (92) hide show

openlit/__helpers.py +88 -0
openlit/__init__.py +4 -3
openlit/instrumentation/ag2/ag2.py +5 -5
openlit/instrumentation/ai21/__init__.py +4 -4
openlit/instrumentation/ai21/ai21.py +370 -319
openlit/instrumentation/ai21/async_ai21.py +371 -319
openlit/instrumentation/anthropic/__init__.py +4 -4
openlit/instrumentation/anthropic/anthropic.py +321 -189
openlit/instrumentation/anthropic/async_anthropic.py +323 -190
openlit/instrumentation/assemblyai/__init__.py +1 -1
openlit/instrumentation/assemblyai/assemblyai.py +59 -43
openlit/instrumentation/astra/astra.py +9 -9
openlit/instrumentation/astra/async_astra.py +9 -9
openlit/instrumentation/azure_ai_inference/__init__.py +4 -4
openlit/instrumentation/azure_ai_inference/async_azure_ai_inference.py +406 -252
openlit/instrumentation/azure_ai_inference/azure_ai_inference.py +406 -252
openlit/instrumentation/bedrock/__init__.py +1 -1
openlit/instrumentation/bedrock/bedrock.py +115 -58
openlit/instrumentation/chroma/chroma.py +9 -9
openlit/instrumentation/cohere/__init__.py +33 -10
openlit/instrumentation/cohere/async_cohere.py +610 -0
openlit/instrumentation/cohere/cohere.py +410 -219
openlit/instrumentation/controlflow/controlflow.py +5 -5
openlit/instrumentation/crawl4ai/async_crawl4ai.py +5 -5
openlit/instrumentation/crawl4ai/crawl4ai.py +5 -5
openlit/instrumentation/crewai/crewai.py +6 -4
openlit/instrumentation/dynamiq/dynamiq.py +5 -5
openlit/instrumentation/elevenlabs/async_elevenlabs.py +71 -46
openlit/instrumentation/elevenlabs/elevenlabs.py +71 -51
openlit/instrumentation/embedchain/embedchain.py +9 -9
openlit/instrumentation/firecrawl/firecrawl.py +5 -5
openlit/instrumentation/google_ai_studio/__init__.py +9 -9
openlit/instrumentation/google_ai_studio/async_google_ai_studio.py +183 -219
openlit/instrumentation/google_ai_studio/google_ai_studio.py +183 -220
openlit/instrumentation/gpt4all/__init__.py +2 -2
openlit/instrumentation/gpt4all/gpt4all.py +345 -220
openlit/instrumentation/gpu/__init__.py +5 -5
openlit/instrumentation/groq/__init__.py +2 -2
openlit/instrumentation/groq/async_groq.py +356 -240
openlit/instrumentation/groq/groq.py +356 -240
openlit/instrumentation/haystack/haystack.py +5 -5
openlit/instrumentation/julep/async_julep.py +5 -5
openlit/instrumentation/julep/julep.py +5 -5
openlit/instrumentation/langchain/__init__.py +13 -7
openlit/instrumentation/langchain/async_langchain.py +384 -0
openlit/instrumentation/langchain/langchain.py +105 -492
openlit/instrumentation/letta/letta.py +11 -9
openlit/instrumentation/litellm/__init__.py +4 -5
openlit/instrumentation/litellm/async_litellm.py +318 -247
openlit/instrumentation/litellm/litellm.py +314 -243
openlit/instrumentation/llamaindex/llamaindex.py +5 -5
openlit/instrumentation/mem0/mem0.py +5 -5
openlit/instrumentation/milvus/milvus.py +9 -9
openlit/instrumentation/mistral/__init__.py +6 -6
openlit/instrumentation/mistral/async_mistral.py +423 -250
openlit/instrumentation/mistral/mistral.py +420 -246
openlit/instrumentation/multion/async_multion.py +6 -4
openlit/instrumentation/multion/multion.py +6 -4
openlit/instrumentation/ollama/__init__.py +8 -30
openlit/instrumentation/ollama/async_ollama.py +385 -417
openlit/instrumentation/ollama/ollama.py +384 -417
openlit/instrumentation/openai/__init__.py +11 -230
openlit/instrumentation/openai/async_openai.py +433 -410
openlit/instrumentation/openai/openai.py +414 -394
openlit/instrumentation/phidata/phidata.py +6 -4
openlit/instrumentation/pinecone/pinecone.py +9 -9
openlit/instrumentation/premai/__init__.py +2 -2
openlit/instrumentation/premai/premai.py +262 -213
openlit/instrumentation/qdrant/async_qdrant.py +9 -9
openlit/instrumentation/qdrant/qdrant.py +9 -9
openlit/instrumentation/reka/__init__.py +2 -2
openlit/instrumentation/reka/async_reka.py +90 -52
openlit/instrumentation/reka/reka.py +90 -52
openlit/instrumentation/together/__init__.py +4 -4
openlit/instrumentation/together/async_together.py +278 -236
openlit/instrumentation/together/together.py +278 -236
openlit/instrumentation/transformers/__init__.py +1 -1
openlit/instrumentation/transformers/transformers.py +76 -45
openlit/instrumentation/vertexai/__init__.py +14 -64
openlit/instrumentation/vertexai/async_vertexai.py +330 -987
openlit/instrumentation/vertexai/vertexai.py +330 -987
openlit/instrumentation/vllm/__init__.py +1 -1
openlit/instrumentation/vllm/vllm.py +66 -36
openlit/otel/metrics.py +98 -7
openlit/semcov/__init__.py +113 -80
{openlit-1.33.8.dist-info → openlit-1.33.10.dist-info}/METADATA +1 -1
openlit-1.33.10.dist-info/RECORD +122 -0
{openlit-1.33.8.dist-info → openlit-1.33.10.dist-info}/WHEEL +1 -1
openlit/instrumentation/openai/async_azure_openai.py +0 -900
openlit/instrumentation/openai/azure_openai.py +0 -898
openlit-1.33.8.dist-info/RECORD +0 -122
{openlit-1.33.8.dist-info → openlit-1.33.10.dist-info}/LICENSE +0 -0

openlit/instrumentation/transformers/__init__.py CHANGED Viewed

@@ -28,7 +28,7 @@ class TransformersInstrumentor(BaseInstrumentor):
         wrap_function_wrapper(
             "transformers",
             "TextGenerationPipeline.__call__",
-            text_wrap("huggingface.text_generation", version, environment, application_name,
+            text_wrap(version, environment, application_name,
                  tracer, pricing_info, trace_content, metrics, disable_metrics),
         )

openlit/instrumentation/transformers/transformers.py CHANGED Viewed

@@ -1,18 +1,24 @@
-# pylint: disable=duplicate-code, broad-exception-caught, too-many-statements, unused-argument
 """
 Module for monitoring ChromaDB.
 """
 import logging
+import time
 from opentelemetry.trace import SpanKind, Status, StatusCode
-from opentelemetry.sdk.resources import TELEMETRY_SDK_NAME
-from openlit.__helpers import handle_exception, general_tokens
+from opentelemetry.sdk.resources import SERVICE_NAME, TELEMETRY_SDK_NAME, DEPLOYMENT_ENVIRONMENT
+from openlit.__helpers import (
+    get_chat_model_cost,
+    handle_exception,
+    general_tokens,
+    create_metrics_attributes,
+    set_server_address_and_port
+)
 from openlit.semcov import SemanticConvetion
 # Initialize logger for logging potential issues and operations
 logger = logging.getLogger(__name__)
-def text_wrap(gen_ai_endpoint, version, environment, application_name,
+def text_wrap(version, environment, application_name,
                  tracer, pricing_info, trace_content, metrics, disable_metrics):
     """
     Creates a wrapper around a function call to trace and log its execution metrics.
@@ -21,7 +27,6 @@ def text_wrap(gen_ai_endpoint, version, environment, application_name,
     log its operation, and trace its execution using OpenTelemetry.
     Parameters:
-    - gen_ai_endpoint (str): A descriptor or name for the endpoint being traced.
     - version (str): The version of the Langchain application.
     - environment (str): The deployment environment (e.g., 'production', 'development').
     - application_name (str): Name of the Langchain application.
@@ -55,8 +60,15 @@ def text_wrap(gen_ai_endpoint, version, environment, application_name,
         errors are handled and logged appropriately.
         """
-        with tracer.start_as_current_span(gen_ai_endpoint, kind= SpanKind.CLIENT) as span:
+        server_address, server_port = set_server_address_and_port(instance, "127.0.0.1", 80)
+        request_model = instance.model.config.name_or_path
+        span_name = f"{SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT} {request_model}"
+        with tracer.start_as_current_span(span_name, kind= SpanKind.CLIENT) as span:
+            start_time = time.time()
             response = wrapped(*args, **kwargs)
+            end_time = time.time()
             # pylint: disable=protected-access
             forward_params = instance._forward_params
@@ -67,27 +79,40 @@ def text_wrap(gen_ai_endpoint, version, environment, application_name,
                 else:
                     prompt = kwargs.get("args", "")
-                prompt_tokens = general_tokens(prompt[0])
+                input_tokens = general_tokens(prompt[0])
                 span.set_attribute(TELEMETRY_SDK_NAME, "openlit")
-                span.set_attribute(SemanticConvetion.GEN_AI_ENDPOINT,
-                                   gen_ai_endpoint)
+                span.set_attribute(SemanticConvetion.GEN_AI_OPERATION,
+                                   SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT)
                 span.set_attribute(SemanticConvetion.GEN_AI_SYSTEM,
                                    SemanticConvetion.GEN_AI_SYSTEM_HUGGING_FACE)
-                span.set_attribute(SemanticConvetion.GEN_AI_ENVIRONMENT,
-                                   environment)
-                span.set_attribute(SemanticConvetion.GEN_AI_APPLICATION_NAME,
-                                   application_name)
-                span.set_attribute(SemanticConvetion.GEN_AI_TYPE,
-                                   SemanticConvetion.GEN_AI_TYPE_CHAT)
                 span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MODEL,
-                                   instance.model.config.name_or_path)
+                                   request_model)
                 span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TEMPERATURE,
                                    forward_params.get("temperature", "null"))
                 span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_TOP_P,
                                    forward_params.get("top_p", "null"))
                 span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_MAX_TOKENS,
                                    forward_params.get("max_length", -1))
+                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_INPUT_TOKENS,
+                                   input_tokens)
+                span.set_attribute(SemanticConvetion.SERVER_ADDRESS,
+                                    server_address)
+                span.set_attribute(SemanticConvetion.SERVER_PORT,
+                                    server_port)
+                span.set_attribute(SemanticConvetion.GEN_AI_RESPONSE_MODEL,
+                                    request_model)
+                span.set_attribute(DEPLOYMENT_ENVIRONMENT,
+                                   environment)
+                span.set_attribute(SERVICE_NAME,
+                                   application_name)
+                span.set_attribute(SemanticConvetion.GEN_AI_REQUEST_IS_STREAM,
+                                    False)
+                span.set_attribute(SemanticConvetion.GEN_AI_SERVER_TTFT,
+                                    end_time - start_time)
+                span.set_attribute(SemanticConvetion.GEN_AI_SDK_VERSION,
+                                    version)
                 if trace_content:
                     span.add_event(
                         name=SemanticConvetion.GEN_AI_CONTENT_PROMPT_EVENT,
@@ -95,11 +120,9 @@ def text_wrap(gen_ai_endpoint, version, environment, application_name,
                             SemanticConvetion.GEN_AI_CONTENT_PROMPT: prompt,
                         },
                     )
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_PROMPT_TOKENS,
-                                prompt_tokens)
                 i = 0
-                completion_tokens = 0
+                output_tokens = 0
                 for completion in response:
                     if len(response) > 1:
                         attribute_name = f"gen_ai.content.completion.{i}"
@@ -115,43 +138,51 @@ def text_wrap(gen_ai_endpoint, version, environment, application_name,
                         span.add_event(
                             name=attribute_name,
                             attributes={
-                                # pylint: disable=line-too-long
                                 SemanticConvetion.GEN_AI_CONTENT_COMPLETION: llm_response,
                             },
                         )
-                    completion_tokens += general_tokens(llm_response)
+                    output_tokens += general_tokens(llm_response)
                     i=i+1
-                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COMPLETION_TOKENS,
-                                   completion_tokens)
+                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_OUTPUT_TOKENS,
+                                   output_tokens)
                 span.set_attribute(SemanticConvetion.GEN_AI_USAGE_TOTAL_TOKENS,
-                                   prompt_tokens + completion_tokens)
+                                   input_tokens + output_tokens)
+                # Calculate cost of the operation
+                cost = get_chat_model_cost(request_model,
+                                            pricing_info, input_tokens,
+                                            output_tokens)
+                span.set_attribute(SemanticConvetion.GEN_AI_USAGE_COST,
+                                    cost)
                 span.set_status(Status(StatusCode.OK))
                 if disable_metrics is False:
-                    attributes = {
-                        TELEMETRY_SDK_NAME:
-                            "openlit",
-                        SemanticConvetion.GEN_AI_APPLICATION_NAME:
-                            application_name,
-                        SemanticConvetion.GEN_AI_SYSTEM:
-                            SemanticConvetion.GEN_AI_SYSTEM_HUGGING_FACE,
-                        SemanticConvetion.GEN_AI_ENVIRONMENT:
-                            environment,
-                        SemanticConvetion.GEN_AI_TYPE:
-                            SemanticConvetion.GEN_AI_TYPE_CHAT,
-                        SemanticConvetion.GEN_AI_REQUEST_MODEL:
-                            instance.model.config.name_or_path
-                    }
+                    attributes = create_metrics_attributes(
+                        service_name=application_name,
+                        deployment_environment=environment,
+                        operation=SemanticConvetion.GEN_AI_OPERATION_TYPE_CHAT,
+                        system=SemanticConvetion.GEN_AI_SYSTEM_HUGGING_FACE,
+                        request_model=request_model,
+                        server_address=server_address,
+                        server_port=server_port,
+                        response_model=request_model,
+                    )
+                    metrics["genai_client_usage_tokens"].record(
+                        input_tokens + output_tokens, attributes
+                    )
+                    metrics["genai_client_operation_duration"].record(
+                        end_time - start_time, attributes
+                    )
+                    metrics["genai_server_ttft"].record(
+                        end_time - start_time, attributes
+                    )
                     metrics["genai_requests"].add(1, attributes)
-                    metrics["genai_total_tokens"].add(
-                        prompt_tokens +
-                        completion_tokens, attributes)
-                    metrics["genai_completion_tokens"].add(
-                        completion_tokens, attributes)
-                    metrics["genai_prompt_tokens"].add(
-                        prompt_tokens, attributes)
+                    metrics["genai_completion_tokens"].add(output_tokens, attributes)
+                    metrics["genai_prompt_tokens"].add(input_tokens, attributes)
+                    metrics["genai_cost"].record(cost, attributes)
                 # Return original response
                 return response

openlit/instrumentation/vertexai/__init__.py CHANGED Viewed

@@ -7,16 +7,10 @@ from opentelemetry.instrumentation.instrumentor import BaseInstrumentor
 from wrapt import wrap_function_wrapper
 from openlit.instrumentation.vertexai.vertexai import (
-    generate_content, predict, predict_streaming,
-    send_message, start_chat, start_chat_streaming,
-    embeddings
+    send_message
 )
 from openlit.instrumentation.vertexai.async_vertexai import (
-    generate_content_async, predict_async,
-    predict_streaming_async,
-    send_message_async,
-    start_chat_async, start_chat_streaming_async,
-    embeddings_async
+    async_send_message
 )
@@ -44,49 +38,28 @@ class VertexAIInstrumentor(BaseInstrumentor):
         wrap_function_wrapper(
             "vertexai.generative_models",
             "GenerativeModel.generate_content",
-            generate_content("vertexai.generate_content", version, environment, application_name,
+            send_message(version, environment, application_name,
                      tracer, pricing_info, trace_content, metrics, disable_metrics),
         )
         wrap_function_wrapper(
             "vertexai.generative_models",
             "ChatSession.send_message",
-            send_message("vertexai.send_message", version, environment, application_name,
-                     tracer, pricing_info, trace_content, metrics, disable_metrics),
-        )
-        wrap_function_wrapper(
-            "vertexai.language_models",
-            "TextGenerationModel.predict",
-            predict("vertexai.predict", version, environment, application_name,
-                     tracer, pricing_info, trace_content, metrics, disable_metrics),
-        )
-        wrap_function_wrapper(
-            "vertexai.language_models",
-            "TextGenerationModel.predict_streaming",
-            predict_streaming("vertexai.predict", version, environment, application_name,
+            send_message(version, environment, application_name,
                      tracer, pricing_info, trace_content, metrics, disable_metrics),
         )
         wrap_function_wrapper(
             "vertexai.language_models",
             "ChatSession.send_message",
-            start_chat("vertexai.send_message", version, environment, application_name,
+            send_message(version, environment, application_name,
                      tracer, pricing_info, trace_content, metrics, disable_metrics),
         )
         wrap_function_wrapper(
             "vertexai.language_models",
             "ChatSession.send_message_streaming",
-            start_chat_streaming("vertexai.send_message", version, environment, application_name,
-                     tracer, pricing_info, trace_content, metrics, disable_metrics),
-        )
-        wrap_function_wrapper(
-            "vertexai.language_models",
-            "TextEmbeddingModel.get_embeddings",
-            embeddings("vertexai.get_embeddings", version, environment, application_name,
+            send_message(version, environment, application_name,
                      tracer, pricing_info, trace_content, metrics, disable_metrics),
         )
@@ -94,52 +67,29 @@ class VertexAIInstrumentor(BaseInstrumentor):
         wrap_function_wrapper(
             "vertexai.generative_models",
             "GenerativeModel.generate_content_async",
-            generate_content_async("vertexai.generate_content", version, environment,
-                                   application_name, tracer, pricing_info, trace_content,
-                                   metrics, disable_metrics),
+            async_send_message(version, environment, application_name,
+                    tracer, pricing_info, trace_content, metrics, disable_metrics),
         )
         wrap_function_wrapper(
             "vertexai.generative_models",
             "ChatSession.send_message_async",
-            send_message_async("vertexai.send_message", version, environment, application_name,
-                     tracer, pricing_info, trace_content, metrics, disable_metrics),
-        )
-        wrap_function_wrapper(
-            "vertexai.language_models",
-            "TextGenerationModel.predict_async",
-            predict_async("vertexai.predict", version, environment, application_name,
-                     tracer, pricing_info, trace_content, metrics, disable_metrics),
-        )
-        wrap_function_wrapper(
-            "vertexai.language_models",
-            "TextGenerationModel.predict_streaming_async",
-            predict_streaming_async("vertexai.predict", version, environment, application_name,
-                     tracer, pricing_info, trace_content, metrics, disable_metrics),
+            async_send_message(version, environment, application_name,
+                    tracer, pricing_info, trace_content, metrics, disable_metrics),
         )
         wrap_function_wrapper(
             "vertexai.language_models",
             "ChatSession.send_message_async",
-            start_chat_async("vertexai.send_message", version, environment, application_name,
-                     tracer, pricing_info, trace_content, metrics, disable_metrics),
+            async_send_message(version, environment, application_name,
+                    tracer, pricing_info, trace_content, metrics, disable_metrics),
         )
         wrap_function_wrapper(
             "vertexai.language_models",
             "ChatSession.send_message_streaming_async",
-            start_chat_streaming_async("vertexai.send_message", version, environment,
-                                       application_name, tracer, pricing_info, trace_content,
-                                       metrics, disable_metrics),
-        )
-        wrap_function_wrapper(
-            "vertexai.language_models",
-            "TextEmbeddingModel.get_embeddings_async",
-            embeddings_async("vertexai.get_embeddings", version, environment, application_name,
-                     tracer, pricing_info, trace_content, metrics, disable_metrics),
+            async_send_message(version, environment, application_name,
+                    tracer, pricing_info, trace_content, metrics, disable_metrics),
         )
     def _uninstrument(self, **kwargs):

openlit 1.33.8__py3-none-any.whl → 1.33.10__py3-none-any.whl

openlit 1.33.8__py3-none-any.whl → 1.33.10__py3-none-any.whl