langtrace-python-sdk 2.1.29__py3-none-any.whl → 2.2.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (58)
  1. examples/cohere_example/chat.py +1 -0
  2. examples/cohere_example/chat_stream.py +3 -0
  3. examples/dspy_example/math_problems_cot_parallel.py +59 -0
  4. examples/gemini_example/__init__.py +6 -0
  5. examples/gemini_example/function_tools.py +62 -0
  6. examples/gemini_example/main.py +91 -0
  7. examples/langchain_example/__init__.py +8 -0
  8. examples/langchain_example/groq_example.py +28 -15
  9. examples/ollama_example/basic.py +1 -0
  10. examples/openai_example/__init__.py +1 -0
  11. examples/openai_example/async_tool_calling_nonstreaming.py +1 -1
  12. examples/openai_example/chat_completion.py +1 -1
  13. examples/openai_example/embeddings_create.py +1 -0
  14. examples/openai_example/images_edit.py +2 -2
  15. examples/vertexai_example/__init__.py +6 -0
  16. examples/vertexai_example/main.py +214 -0
  17. langtrace_python_sdk/constants/instrumentation/common.py +2 -0
  18. langtrace_python_sdk/constants/instrumentation/gemini.py +12 -0
  19. langtrace_python_sdk/constants/instrumentation/vertexai.py +42 -0
  20. langtrace_python_sdk/instrumentation/__init__.py +4 -0
  21. langtrace_python_sdk/instrumentation/anthropic/patch.py +68 -96
  22. langtrace_python_sdk/instrumentation/chroma/patch.py +29 -29
  23. langtrace_python_sdk/instrumentation/cohere/patch.py +143 -242
  24. langtrace_python_sdk/instrumentation/dspy/instrumentation.py +2 -2
  25. langtrace_python_sdk/instrumentation/dspy/patch.py +36 -36
  26. langtrace_python_sdk/instrumentation/gemini/__init__.py +3 -0
  27. langtrace_python_sdk/instrumentation/gemini/instrumentation.py +36 -0
  28. langtrace_python_sdk/instrumentation/gemini/patch.py +186 -0
  29. langtrace_python_sdk/instrumentation/groq/patch.py +82 -125
  30. langtrace_python_sdk/instrumentation/ollama/patch.py +62 -65
  31. langtrace_python_sdk/instrumentation/openai/patch.py +190 -494
  32. langtrace_python_sdk/instrumentation/qdrant/patch.py +6 -6
  33. langtrace_python_sdk/instrumentation/vertexai/__init__.py +3 -0
  34. langtrace_python_sdk/instrumentation/vertexai/instrumentation.py +33 -0
  35. langtrace_python_sdk/instrumentation/vertexai/patch.py +131 -0
  36. langtrace_python_sdk/langtrace.py +5 -0
  37. langtrace_python_sdk/utils/__init__.py +14 -3
  38. langtrace_python_sdk/utils/llm.py +311 -6
  39. langtrace_python_sdk/version.py +1 -1
  40. {langtrace_python_sdk-2.1.29.dist-info → langtrace_python_sdk-2.2.2.dist-info}/METADATA +26 -19
  41. {langtrace_python_sdk-2.1.29.dist-info → langtrace_python_sdk-2.2.2.dist-info}/RECORD +58 -38
  42. tests/anthropic/test_anthropic.py +28 -27
  43. tests/cohere/test_cohere_chat.py +36 -36
  44. tests/cohere/test_cohere_embed.py +12 -9
  45. tests/cohere/test_cohere_rerank.py +18 -11
  46. tests/groq/cassettes/test_async_chat_completion.yaml +113 -0
  47. tests/groq/cassettes/test_async_chat_completion_streaming.yaml +2232 -0
  48. tests/groq/cassettes/test_chat_completion.yaml +114 -0
  49. tests/groq/cassettes/test_chat_completion_streaming.yaml +2512 -0
  50. tests/groq/conftest.py +33 -0
  51. tests/groq/test_groq.py +142 -0
  52. tests/openai/cassettes/test_async_chat_completion_streaming.yaml +28 -28
  53. tests/openai/test_chat_completion.py +53 -67
  54. tests/openai/test_image_generation.py +47 -24
  55. tests/utils.py +40 -5
  56. {langtrace_python_sdk-2.1.29.dist-info → langtrace_python_sdk-2.2.2.dist-info}/WHEEL +0 -0
  57. {langtrace_python_sdk-2.1.29.dist-info → langtrace_python_sdk-2.2.2.dist-info}/entry_points.txt +0 -0
  58. {langtrace_python_sdk-2.1.29.dist-info → langtrace_python_sdk-2.2.2.dist-info}/licenses/LICENSE +0 -0
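The headline changes in this release are the new Gemini and Vertex AI instrumentations and the consolidation of per-integration span-attribute boilerplate into shared helpers in langtrace_python_sdk/utils/llm.py, as the diffs below show. As orientation, a minimal sketch of picking the new instrumentations up; `langtrace.init()` is the SDK's documented entry point, and auto-patching of installed gemini/vertexai clients is an assumption based on the new files listed above:

# Minimal sketch, not verbatim from this release. The api_key value is a
# placeholder; init() is assumed to enable all installed instrumentations,
# including the new gemini/ and vertexai/ packages added in 2.2.x.
from langtrace_python_sdk import langtrace

langtrace.init(api_key="<your-langtrace-api-key>")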
langtrace_python_sdk/instrumentation/groq/patch.py
@@ -17,11 +17,21 @@ limitations under the License.
 import json
 
 from langtrace.trace_attributes import Event, LLMSpanAttributes
+from langtrace_python_sdk.utils import set_span_attribute
 from opentelemetry import baggage, trace
 from opentelemetry.trace.propagation import set_span_in_context
 from opentelemetry.trace import SpanKind
 from opentelemetry.trace.status import Status, StatusCode
 
+from langtrace_python_sdk.utils.llm import (
+    get_base_url,
+    get_extra_attributes,
+    get_llm_request_attributes,
+    get_llm_url,
+    get_langtrace_attributes,
+    set_event_completion,
+    set_usage_attributes,
+)
 from langtrace_python_sdk.constants.instrumentation.common import (
     LANGTRACE_ADDITIONAL_SPAN_ATTRIBUTES_KEY,
     SERVICE_PROVIDERS,
@@ -31,26 +41,20 @@ from langtrace_python_sdk.utils.llm import calculate_prompt_tokens, estimate_tok
 from importlib_metadata import version as v
 
 from langtrace_python_sdk.constants import LANGTRACE_SDK_NAME
+from langtrace.trace_attributes import SpanAttributes
 
 
 def chat_completions_create(original_method, version, tracer):
     """Wrap the `create` method of the `ChatCompletion` class to trace it."""
 
     def traced_method(wrapped, instance, args, kwargs):
-        base_url = (
-            str(instance._client._base_url)
-            if hasattr(instance, "_client") and hasattr(instance._client, "_base_url")
-            else ""
-        )
         service_provider = SERVICE_PROVIDERS["GROQ"]
         # If base url contains perplexity or azure, set the service provider accordingly
-        if "perplexity" in base_url:
+        if "perplexity" in get_base_url(instance):
             service_provider = SERVICE_PROVIDERS["PPLX"]
-        elif "azure" in base_url:
+        elif "azure" in get_base_url(instance):
             service_provider = SERVICE_PROVIDERS["AZURE"]
 
-        extra_attributes = baggage.get_baggage(LANGTRACE_ADDITIONAL_SPAN_ATTRIBUTES_KEY)
-
         # handle tool calls in the kwargs
         llm_prompts = []
         for item in kwargs.get("messages", []):
@@ -80,27 +84,16 @@ def chat_completions_create(original_method, version, tracer):
                 llm_prompts.append(item)
 
         span_attributes = {
-            "langtrace.sdk.name": "langtrace-python-sdk",
-            "langtrace.service.name": service_provider,
-            "langtrace.service.type": "llm",
-            "langtrace.service.version": version,
-            "langtrace.version": v(LANGTRACE_SDK_NAME),
-            "url.full": base_url,
-            "llm.api": APIS["CHAT_COMPLETION"]["ENDPOINT"],
-            "llm.prompts": json.dumps(llm_prompts),
-            "llm.stream": kwargs.get("stream"),
-            **(extra_attributes if extra_attributes is not None else {}),
+            **get_langtrace_attributes(version, service_provider),
+            **get_llm_request_attributes(kwargs, prompts=llm_prompts),
+            **get_llm_url(instance),
+            SpanAttributes.LLM_PATH: APIS["CHAT_COMPLETION"]["ENDPOINT"],
+            **get_extra_attributes(),
         }
 
         attributes = LLMSpanAttributes(**span_attributes)
 
         tools = []
-        if kwargs.get("temperature") is not None:
-            attributes.llm_temperature = kwargs.get("temperature")
-        if kwargs.get("top_p") is not None:
-            attributes.llm_top_p = kwargs.get("top_p")
-        if kwargs.get("user") is not None:
-            attributes.llm_user = kwargs.get("user")
         if kwargs.get("functions") is not None:
             for function in kwargs.get("functions"):
                 tools.append(json.dumps({"type": "function", "function": function}))
@@ -111,20 +104,21 @@ def chat_completions_create(original_method, version, tracer):
 
         # TODO(Karthik): Gotta figure out how to handle streaming with context
         # with tracer.start_as_current_span(APIS["CHAT_COMPLETION"]["METHOD"],
-        # kind=SpanKind.CLIENT) as span:
+        # kind=SpanKind.CLIENT.value) as span:
         span = tracer.start_span(
             APIS["CHAT_COMPLETION"]["METHOD"],
-            kind=SpanKind.CLIENT,
+            kind=SpanKind.CLIENT.value,
             context=set_span_in_context(trace.get_current_span()),
         )
         for field, value in attributes.model_dump(by_alias=True).items():
-            if value is not None:
-                span.set_attribute(field, value)
+            set_span_attribute(span, field, value)
         try:
             # Attempt to call the original method
             result = wrapped(*args, **kwargs)
             if kwargs.get("stream") is False or kwargs.get("stream") is None:
-                span.set_attribute("llm.model", result.model)
+                set_span_attribute(
+                    span, SpanAttributes.LLM_RESPONSE_MODEL, result.model
+                )
                 if hasattr(result, "choices") and result.choices is not None:
                     responses = [
                         {
@@ -146,27 +140,23 @@ def chat_completions_create(original_method, version, tracer):
                         }
                         for choice in result.choices
                     ]
-                    span.set_attribute("llm.responses", json.dumps(responses))
-                else:
-                    responses = []
-                    span.set_attribute("llm.responses", json.dumps(responses))
+                    set_event_completion(span, responses)
+
                 if (
                     hasattr(result, "system_fingerprint")
                     and result.system_fingerprint is not None
                 ):
-                    span.set_attribute(
-                        "llm.system.fingerprint", result.system_fingerprint
+                    set_span_attribute(
+                        span,
+                        SpanAttributes.LLM_SYSTEM_FINGERPRINT,
+                        result.system_fingerprint,
                     )
+
                 # Get the usage
                 if hasattr(result, "usage") and result.usage is not None:
                     usage = result.usage
-                    if usage is not None:
-                        usage_dict = {
-                            "input_tokens": result.usage.prompt_tokens,
-                            "output_tokens": usage.completion_tokens,
-                            "total_tokens": usage.total_tokens,
-                        }
-                        span.set_attribute("llm.token.counts", json.dumps(usage_dict))
+                    set_usage_attributes(span, dict(usage))
+
                 span.set_status(StatusCode.OK)
                 span.end()
                 return result
@@ -255,7 +245,7 @@ def chat_completions_create(original_method, version, tracer):
                     span.add_event(
                         Event.STREAM_OUTPUT.value,
                         {
-                            "response": (
+                            SpanAttributes.LLM_CONTENT_COMPLETION_CHUNK: (
                                 "".join(content)
                                 if len(content) > 0 and content[0] is not None
                                 else ""
@@ -267,27 +257,14 @@ def chat_completions_create(original_method, version, tracer):
         finally:
             # Finalize span after processing all chunks
             span.add_event(Event.STREAM_END.value)
-            span.set_attribute(
-                "llm.token.counts",
-                json.dumps(
-                    {
-                        "input_tokens": prompt_tokens,
-                        "output_tokens": completion_tokens,
-                        "total_tokens": prompt_tokens + completion_tokens,
-                    }
-                ),
+            set_usage_attributes(
+                span,
+                {"input_tokens": prompt_tokens, "output_tokens": completion_tokens},
            )
-            span.set_attribute(
-                "llm.responses",
-                json.dumps(
-                    [
-                        {
-                            "role": "assistant",
-                            "content": "".join(result_content),
-                        }
-                    ]
-                ),
+            set_event_completion(
+                span, [{"role": "assistant", "content": "".join(result_content)}]
            )
+
             span.set_status(StatusCode.OK)
             span.end()
 
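The hunk above replaces two hand-assembled JSON attributes ("llm.token.counts" and "llm.responses") with two helper calls. A minimal sketch of the finalization pattern the sync path (and the async path further down) now shares; the helper signatures are inferred from this diff, not copied from the SDK source:

# Sketch of the shared stream-finalization pattern (illustrative only).
from langtrace_python_sdk.utils.llm import set_event_completion, set_usage_attributes

def finalize_stream(span, prompt_tokens, completion_tokens, result_content):
    # Usage is recorded as discrete token attributes; the helper is assumed
    # to derive the total from input + output itself.
    set_usage_attributes(
        span,
        {"input_tokens": prompt_tokens, "output_tokens": completion_tokens},
    )
    # The assembled assistant message is attached as a completion event
    # instead of a JSON-encoded "llm.responses" attribute.
    set_event_completion(
        span, [{"role": "assistant", "content": "".join(result_content)}]
    )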
@@ -299,20 +276,13 @@ def async_chat_completions_create(original_method, version, tracer):
     """Wrap the `create` method of the `ChatCompletion` class to trace it."""
 
     async def traced_method(wrapped, instance, args, kwargs):
-        base_url = (
-            str(instance._client._base_url)
-            if hasattr(instance, "_client") and hasattr(instance._client, "_base_url")
-            else ""
-        )
         service_provider = SERVICE_PROVIDERS["GROQ"]
         # If base url contains perplexity or azure, set the service provider accordingly
-        if "perplexity" in base_url:
+        if "perplexity" in get_base_url(instance):
             service_provider = SERVICE_PROVIDERS["PPLX"]
-        elif "azure" in base_url:
+        elif "azure" in get_base_url(instance):
             service_provider = SERVICE_PROVIDERS["AZURE"]
 
-        extra_attributes = baggage.get_baggage(LANGTRACE_ADDITIONAL_SPAN_ATTRIBUTES_KEY)
-
         # handle tool calls in the kwargs
         llm_prompts = []
         for item in kwargs.get("messages", []):
@@ -342,27 +312,17 @@ def async_chat_completions_create(original_method, version, tracer):
                 llm_prompts.append(item)
 
         span_attributes = {
-            "langtrace.sdk.name": "langtrace-python-sdk",
-            "langtrace.service.name": service_provider,
-            "langtrace.service.type": "llm",
-            "langtrace.service.version": version,
-            "langtrace.version": v(LANGTRACE_SDK_NAME),
-            "url.full": base_url,
-            "llm.api": APIS["CHAT_COMPLETION"]["ENDPOINT"],
-            "llm.prompts": json.dumps(llm_prompts),
-            "llm.stream": kwargs.get("stream"),
-            **(extra_attributes if extra_attributes is not None else {}),
+            **get_langtrace_attributes(version, service_provider),
+            **get_llm_request_attributes(kwargs, prompts=llm_prompts),
+            **get_llm_url(instance),
+            SpanAttributes.LLM_PATH: APIS["CHAT_COMPLETION"]["ENDPOINT"],
+            **get_extra_attributes(),
         }
 
         attributes = LLMSpanAttributes(**span_attributes)
 
         tools = []
-        if kwargs.get("temperature") is not None:
-            attributes.llm_temperature = kwargs.get("temperature")
-        if kwargs.get("top_p") is not None:
-            attributes.llm_top_p = kwargs.get("top_p")
-        if kwargs.get("user") is not None:
-            attributes.llm_user = kwargs.get("user")
+
         if kwargs.get("functions") is not None:
             for function in kwargs.get("functions"):
                 tools.append(json.dumps({"type": "function", "function": function}))
@@ -373,18 +333,19 @@ def async_chat_completions_create(original_method, version, tracer):
 
         # TODO(Karthik): Gotta figure out how to handle streaming with context
         # with tracer.start_as_current_span(APIS["CHAT_COMPLETION"]["METHOD"],
-        # kind=SpanKind.CLIENT) as span:
+        # kind=SpanKind.CLIENT.value) as span:
         span = tracer.start_span(
-            APIS["CHAT_COMPLETION"]["METHOD"], kind=SpanKind.CLIENT
+            APIS["CHAT_COMPLETION"]["METHOD"], kind=SpanKind.CLIENT.value
         )
         for field, value in attributes.model_dump(by_alias=True).items():
-            if value is not None:
-                span.set_attribute(field, value)
+            set_span_attribute(span, field, value)
         try:
             # Attempt to call the original method
             result = await wrapped(*args, **kwargs)
             if kwargs.get("stream") is False or kwargs.get("stream") is None:
-                span.set_attribute("llm.model", result.model)
+                set_span_attribute(
+                    span, SpanAttributes.LLM_RESPONSE_MODEL, result.model
+                )
                 if hasattr(result, "choices") and result.choices is not None:
                     responses = [
                         {
@@ -406,27 +367,25 @@ def async_chat_completions_create(original_method, version, tracer):
                         }
                         for choice in result.choices
                     ]
-                    span.set_attribute("llm.responses", json.dumps(responses))
-                else:
-                    responses = []
-                    span.set_attribute("llm.responses", json.dumps(responses))
+
+                    set_event_completion(span, responses)
+
                 if (
                     hasattr(result, "system_fingerprint")
                     and result.system_fingerprint is not None
                 ):
-                    span.set_attribute(
-                        "llm.system.fingerprint", result.system_fingerprint
+                    set_span_attribute(
+                        span,
+                        SpanAttributes.LLM_SYSTEM_FINGERPRINT,
+                        result.system_fingerprint,
                     )
+
                 # Get the usage
                 if hasattr(result, "usage") and result.usage is not None:
                     usage = result.usage
                     if usage is not None:
-                        usage_dict = {
-                            "input_tokens": result.usage.prompt_tokens,
-                            "output_tokens": usage.completion_tokens,
-                            "total_tokens": usage.total_tokens,
-                        }
-                        span.set_attribute("llm.token.counts", json.dumps(usage_dict))
+                        set_usage_attributes(span, dict(usage))
+
                 span.set_status(StatusCode.OK)
                 span.end()
                 return result
@@ -469,6 +428,9 @@ def async_chat_completions_create(original_method, version, tracer):
             try:
                 async for chunk in result:
                     if hasattr(chunk, "model") and chunk.model is not None:
+                        set_span_attribute(
+                            span, SpanAttributes.LLM_RESPONSE_MODEL, chunk.model
+                        )
                         span.set_attribute("llm.model", chunk.model)
                     if hasattr(chunk, "choices") and chunk.choices is not None:
                         if not function_call and not tool_calls:
@@ -513,9 +475,9 @@ def async_chat_completions_create(original_method, version, tracer):
                     else:
                         content = []
                     span.add_event(
-                        Event.STREAM_OUTPUT.value,
+                        Event.RESPONSE.value,
                         {
-                            "response": (
+                            SpanAttributes.LLM_COMPLETIONS: (
                                 "".join(content)
                                 if len(content) > 0 and content[0] is not None
                                 else ""
@@ -527,27 +489,22 @@ def async_chat_completions_create(original_method, version, tracer):
             finally:
                 # Finalize span after processing all chunks
                 span.add_event(Event.STREAM_END.value)
-                span.set_attribute(
-                    "llm.token.counts",
-                    json.dumps(
+
+                set_usage_attributes(
+                    span,
+                    {"input_tokens": prompt_tokens, "output_tokens": completion_tokens},
+                )
+
+                set_event_completion(
+                    span,
+                    [
                         {
-                            "input_tokens": prompt_tokens,
-                            "output_tokens": completion_tokens,
-                            "total_tokens": prompt_tokens + completion_tokens,
+                            "role": "assistant",
+                            "content": "".join(result_content),
                         }
-                    ),
-                )
-                span.set_attribute(
-                    "llm.responses",
-                    json.dumps(
-                        [
-                            {
-                                "role": "assistant",
-                                "content": "".join(result_content),
-                            }
-                        ]
-                    ),
+                    ],
                 )
+
                 span.set_status(StatusCode.OK)
                 span.end()
 
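That is the whole groq/patch.py change: provider detection goes through `get_base_url(instance)`, and the span-attribute dict is assembled from shared helpers instead of being rebuilt in every integration. A sketch of the consolidated pattern, with helper behavior inferred from how the hunks above use them (the comments are assumptions, not documented semantics):

# Sketch of the helper-based span setup groq/patch.py now uses.
from langtrace.trace_attributes import LLMSpanAttributes, SpanAttributes
from langtrace_python_sdk.utils import set_span_attribute
from langtrace_python_sdk.utils.llm import (
    get_extra_attributes,        # assumed: baggage-propagated user attributes
    get_langtrace_attributes,    # assumed: sdk name/version, service type/version
    get_llm_request_attributes,  # assumed: model, stream, temperature, prompts, ...
    get_llm_url,                 # assumed: url.full derived from instance._client
)

def apply_span_attributes(span, version, service_provider, instance, kwargs, endpoint):
    span_attributes = {
        **get_langtrace_attributes(version, service_provider),
        **get_llm_request_attributes(kwargs, prompts=kwargs.get("messages")),
        **get_llm_url(instance),
        SpanAttributes.LLM_PATH: endpoint,
        **get_extra_attributes(),
    }
    # LLMSpanAttributes validates the dict; set_span_attribute is assumed to
    # skip None values, replacing the old `if value is not None` guard.
    attributes = LLMSpanAttributes(**span_attributes)
    for field, value in attributes.model_dump(by_alias=True).items():
        set_span_attribute(span, field, value)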
langtrace_python_sdk/instrumentation/ollama/patch.py
@@ -1,41 +1,35 @@
 from langtrace_python_sdk.constants.instrumentation.ollama import APIS
-from importlib_metadata import version as v
-from langtrace_python_sdk.constants import LANGTRACE_SDK_NAME
 from langtrace_python_sdk.utils import set_span_attribute
-from langtrace_python_sdk.utils.silently_fail import silently_fail
-from langtrace_python_sdk.constants.instrumentation.common import (
-    LANGTRACE_ADDITIONAL_SPAN_ATTRIBUTES_KEY,
-    SERVICE_PROVIDERS,
+from langtrace_python_sdk.utils.llm import (
+    get_extra_attributes,
+    get_langtrace_attributes,
+    get_llm_request_attributes,
+    get_llm_url,
+    set_event_completion,
 )
-from opentelemetry import baggage
+from langtrace_python_sdk.utils.silently_fail import silently_fail
+from langtrace_python_sdk.constants.instrumentation.common import SERVICE_PROVIDERS
 from langtrace.trace_attributes import LLMSpanAttributes, Event
 from opentelemetry.trace import SpanKind
 import json
 from opentelemetry.trace.status import Status, StatusCode
+from langtrace.trace_attributes import SpanAttributes
 
 
 def generic_patch(operation_name, version, tracer):
     def traced_method(wrapped, instance, args, kwargs):
-        base_url = (
-            str(instance._client._base_url)
-            if hasattr(instance, "_client") and hasattr(instance._client, "_base_url")
-            else ""
-        )
         api = APIS[operation_name]
         service_provider = SERVICE_PROVIDERS["OLLAMA"]
-        extra_attributes = baggage.get_baggage(LANGTRACE_ADDITIONAL_SPAN_ATTRIBUTES_KEY)
         span_attributes = {
-            "langtrace.sdk.name": "langtrace-python-sdk",
-            "langtrace.service.name": service_provider,
-            "langtrace.service.type": "llm",
-            "langtrace.service.version": version,
-            "langtrace.version": v(LANGTRACE_SDK_NAME),
-            "llm.model": kwargs.get("model"),
-            "llm.stream": kwargs.get("stream"),
-            "url.full": base_url,
-            "llm.api": api["ENDPOINT"],
-            "llm.response_format": kwargs.get("format"),
-            **(extra_attributes if extra_attributes is not None else {}),
+            **get_langtrace_attributes(version, service_provider),
+            **get_llm_request_attributes(
+                kwargs,
+                prompts=kwargs.get("messages", None),
+            ),
+            **get_llm_url(instance),
+            SpanAttributes.LLM_PATH: api["ENDPOINT"],
+            SpanAttributes.LLM_RESPONSE_FORMAT: kwargs.get("format"),
+            **get_extra_attributes(),
         }
 
         attributes = LLMSpanAttributes(**span_attributes)
@@ -77,24 +71,14 @@ def ageneric_patch(operation_name, version, tracer):
     async def traced_method(wrapped, instance, args, kwargs):
         api = APIS[operation_name]
         service_provider = SERVICE_PROVIDERS["OLLAMA"]
-        extra_attributes = baggage.get_baggage(LANGTRACE_ADDITIONAL_SPAN_ATTRIBUTES_KEY)
         span_attributes = {
-            "langtrace.sdk.name": "langtrace-python-sdk",
-            "langtrace.service.name": service_provider,
-            "url.full": "",
-            "llm.api": "",
-            "langtrace.service.type": "llm",
-            "langtrace.service.version": version,
-            "langtrace.version": v(LANGTRACE_SDK_NAME),
-            "llm.model": kwargs.get("model"),
-            "llm.stream": kwargs.get("stream"),
-            "llm.response_format": kwargs.get("format"),
-            "http.timeout": (
-                kwargs.get("keep_alive") if "keep_alive" in kwargs else None
-            ),
-            **(extra_attributes if extra_attributes is not None else {}),
+            **get_langtrace_attributes(version, service_provider),
+            **get_llm_request_attributes(kwargs),
+            **get_llm_url(instance),
+            SpanAttributes.LLM_PATH: api["ENDPOINT"],
+            SpanAttributes.LLM_RESPONSE_FORMAT: kwargs.get("format"),
+            **get_extra_attributes(),
         }
-
         attributes = LLMSpanAttributes(**span_attributes)
         with tracer.start_as_current_span(api["METHOD"], kind=SpanKind.CLIENT) as span:
             _set_input_attributes(span, kwargs, attributes)
@@ -130,23 +114,25 @@ def _set_response_attributes(span, response):
     input_tokens = response.get("prompt_eval_count") or 0
     output_tokens = response.get("eval_count") or 0
     total_tokens = input_tokens + output_tokens
-    usage_dict = {
-        "input_tokens": input_tokens,
-        "output_tokens": output_tokens,
-        "total_tokens": total_tokens,
-    }
 
     if total_tokens > 0:
-        set_span_attribute(span, "llm.token.counts", json.dumps(usage_dict))
-    set_span_attribute(span, "llm.finish_reason", response.get("done_reason"))
+        set_span_attribute(span, SpanAttributes.LLM_USAGE_PROMPT_TOKENS, input_tokens)
+        set_span_attribute(
+            span, SpanAttributes.LLM_USAGE_COMPLETION_TOKENS, output_tokens
+        )
+        set_span_attribute(span, SpanAttributes.LLM_USAGE_TOTAL_TOKENS, total_tokens)
+
+    set_span_attribute(
+        span,
+        SpanAttributes.LLM_RESPONSE_FINISH_REASON,
+        response.get("done_reason"),
+    )
     if "message" in response:
-        set_span_attribute(span, "llm.responses", json.dumps([response.get("message")]))
+        set_event_completion(span, [response.get("message")])
 
     if "response" in response:
-        set_span_attribute(
-            span,
-            "llm.responses",
-            json.dumps([{"role": "assistant", "content": response.get("response")}]),
+        set_event_completion(
+            span, [{"role": "assistant", "content": response.get("response")}]
        )
 
@@ -156,26 +142,23 @@ def _set_input_attributes(span, kwargs, attributes):
 
     for field, value in attributes.model_dump(by_alias=True).items():
         set_span_attribute(span, field, value)
-    if "messages" in kwargs:
+
+    if "options" in kwargs:
         set_span_attribute(
             span,
-            "llm.prompts",
-            json.dumps(kwargs.get("messages", [])),
+            SpanAttributes.LLM_REQUEST_TEMPERATURE,
+            options.get("temperature"),
         )
-    if "prompt" in kwargs:
+        set_span_attribute(span, SpanAttributes.LLM_REQUEST_TOP_P, options.get("top_p"))
         set_span_attribute(
             span,
-            "llm.prompts",
-            json.dumps([{"role": "user", "content": kwargs.get("prompt", "")}]),
+            SpanAttributes.LLM_FREQUENCY_PENALTY,
+            options.get("frequency_penalty"),
         )
-    if "options" in kwargs:
-        set_span_attribute(span, "llm.temperature", options.get("temperature"))
-        set_span_attribute(span, "llm.top_p", options.get("top_p"))
         set_span_attribute(
-            span, "llm.frequency_penalty", options.get("frequency_penalty")
-        )
-        set_span_attribute(
-            span, "llm.presence_penalty", options.get("presence_penalty")
+            span,
+            SpanAttributes.LLM_PRESENCE_PENALTY,
+            options.get("presence_penalty"),
         )
 
 
@@ -194,6 +177,14 @@ def _handle_streaming_response(span, response, api):
             if api == "generate":
                 accumulated_tokens["response"] += chunk["response"]
 
+            span.add_event(
+                Event.STREAM_OUTPUT.value,
+                {
+                    SpanAttributes.LLM_CONTENT_COMPLETION_CHUNK: chunk.get("response")
+                    or chunk.get("message").get("content"),
+                },
+            )
+
             _set_response_attributes(span, chunk | accumulated_tokens)
     finally:
         # Finalize span after processing all chunks
@@ -220,6 +211,12 @@ async def _ahandle_streaming_response(span, response, api):
             if api == "generate":
                 accumulated_tokens["response"] += chunk["response"]
 
+            span.add_event(
+                Event.STREAM_OUTPUT.value,
+                {
+                    SpanAttributes.LLM_CONTENT_COMPLETION_CHUNK: json.dumps(chunk),
+                },
+            )
             _set_response_attributes(span, chunk | accumulated_tokens)
     finally:
         # Finalize span after processing all chunks
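Both ollama streaming handlers now also emit a per-chunk STREAM_OUTPUT event before updating the response attributes. A minimal sketch of that event shape, assuming the chunk dicts carry either a "response" field (generate) or a "message" field (chat) as the hunks above suggest:

# Sketch of the per-chunk event the ollama handlers now emit
# (chunk shape assumed from the diff; illustrative only).
from langtrace.trace_attributes import Event, SpanAttributes

def emit_chunk_event(span, chunk: dict):
    # Prefer the generate-style "response" text, else the chat-style message content.
    content = chunk.get("response") or chunk.get("message", {}).get("content", "")
    span.add_event(
        Event.STREAM_OUTPUT.value,
        {SpanAttributes.LLM_CONTENT_COMPLETION_CHUNK: content},
    )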