PyPI - braintrust - Versions diffs - 0.3.14__py3-none-any.whl → 0.4.0__py3-none-any.whl - Mend

braintrust 0.3.14__py3-none-any.whl → 0.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (83) hide show

braintrust/__init__.py +4 -0
braintrust/_generated_types.py +1200 -611
braintrust/audit.py +2 -2
braintrust/cli/eval.py +6 -7
braintrust/cli/push.py +11 -11
braintrust/conftest.py +1 -0
braintrust/context.py +12 -17
braintrust/contrib/temporal/__init__.py +16 -27
braintrust/contrib/temporal/test_temporal.py +8 -3
braintrust/devserver/auth.py +8 -8
braintrust/devserver/cache.py +3 -4
braintrust/devserver/cors.py +8 -7
braintrust/devserver/dataset.py +3 -5
braintrust/devserver/eval_hooks.py +7 -6
braintrust/devserver/schemas.py +22 -19
braintrust/devserver/server.py +19 -12
braintrust/devserver/test_cached_login.py +4 -4
braintrust/framework.py +128 -140
braintrust/framework2.py +88 -87
braintrust/functions/invoke.py +93 -53
braintrust/functions/stream.py +3 -2
braintrust/generated_types.py +17 -1
braintrust/git_fields.py +11 -11
braintrust/gitutil.py +2 -3
braintrust/graph_util.py +10 -10
braintrust/id_gen.py +2 -2
braintrust/logger.py +346 -357
braintrust/merge_row_batch.py +10 -9
braintrust/oai.py +107 -24
braintrust/otel/__init__.py +49 -49
braintrust/otel/context.py +16 -30
braintrust/otel/test_distributed_tracing.py +14 -11
braintrust/otel/test_otel_bt_integration.py +32 -31
braintrust/parameters.py +8 -8
braintrust/prompt.py +14 -14
braintrust/prompt_cache/disk_cache.py +5 -4
braintrust/prompt_cache/lru_cache.py +3 -2
braintrust/prompt_cache/prompt_cache.py +13 -14
braintrust/queue.py +4 -4
braintrust/score.py +4 -4
braintrust/serializable_data_class.py +4 -4
braintrust/span_identifier_v1.py +1 -2
braintrust/span_identifier_v2.py +3 -4
braintrust/span_identifier_v3.py +23 -20
braintrust/span_identifier_v4.py +34 -25
braintrust/test_framework.py +16 -6
braintrust/test_helpers.py +5 -5
braintrust/test_id_gen.py +2 -3
braintrust/test_otel.py +61 -53
braintrust/test_queue.py +0 -1
braintrust/test_score.py +1 -3
braintrust/test_span_components.py +29 -44
braintrust/util.py +9 -8
braintrust/version.py +2 -2
braintrust/wrappers/_anthropic_utils.py +4 -4
braintrust/wrappers/agno/__init__.py +3 -4
braintrust/wrappers/agno/agent.py +1 -2
braintrust/wrappers/agno/function_call.py +1 -2
braintrust/wrappers/agno/model.py +1 -2
braintrust/wrappers/agno/team.py +1 -2
braintrust/wrappers/agno/utils.py +12 -12
braintrust/wrappers/anthropic.py +7 -8
braintrust/wrappers/claude_agent_sdk/__init__.py +3 -4
braintrust/wrappers/claude_agent_sdk/_wrapper.py +29 -27
braintrust/wrappers/dspy.py +15 -17
braintrust/wrappers/google_genai/__init__.py +16 -16
braintrust/wrappers/langchain.py +22 -24
braintrust/wrappers/litellm.py +4 -3
braintrust/wrappers/openai.py +15 -15
braintrust/wrappers/pydantic_ai.py +1204 -0
braintrust/wrappers/test_agno.py +0 -1
braintrust/wrappers/test_dspy.py +0 -1
braintrust/wrappers/test_google_genai.py +2 -3
braintrust/wrappers/test_litellm.py +0 -1
braintrust/wrappers/test_oai_attachments.py +322 -0
braintrust/wrappers/test_pydantic_ai_integration.py +1788 -0
braintrust/wrappers/{test_pydantic_ai.py → test_pydantic_ai_wrap_openai.py} +1 -2
{braintrust-0.3.14.dist-info → braintrust-0.4.0.dist-info}/METADATA +3 -2
braintrust-0.4.0.dist-info/RECORD +120 -0
braintrust-0.3.14.dist-info/RECORD +0 -117
{braintrust-0.3.14.dist-info → braintrust-0.4.0.dist-info}/WHEEL +0 -0
{braintrust-0.3.14.dist-info → braintrust-0.4.0.dist-info}/entry_points.txt +0 -0
{braintrust-0.3.14.dist-info → braintrust-0.4.0.dist-info}/top_level.txt +0 -0

braintrust/test_span_components.py CHANGED Viewed

@@ -6,7 +6,6 @@ Tests serialization, deserialization, OTEL compatibility, and backward compatibi
 from uuid import uuid4
 import pytest
 from braintrust.id_gen import OTELIDGenerator
 from braintrust.span_identifier_v3 import SpanComponentsV3, SpanObjectTypeV3
 from braintrust.span_identifier_v4 import SpanComponentsV4
@@ -22,7 +21,7 @@ class TestSpanComponentsV3:
             object_id=str(uuid4()),
             row_id=str(uuid4()),
             span_id=str(uuid4()),
-            root_span_id=str(uuid4())
+            root_span_id=str(uuid4()),
         )
         exported = components.to_str()
@@ -39,7 +38,7 @@ class TestSpanComponentsV3:
         components = SpanComponentsV3(
             object_type=SpanObjectTypeV3.EXPERIMENT,
             object_id=str(uuid4()),
-            propagated_event={"key": "value", "nested": {"a": 1}}
+            propagated_event={"key": "value", "nested": {"a": 1}},
         )
         exported = components.to_str()
@@ -53,15 +52,15 @@ class TestSpanComponentsV3:
         """Test that V3 fails to preserve OTEL hex strings for 16-byte IDs (converts to UUID format)."""
         otel_gen = OTELIDGenerator()
         trace_id = otel_gen.get_trace_id()  # 32-char hex (16 bytes)
-        span_id = otel_gen.get_span_id()    # 16-char hex (8 bytes)
+        span_id = otel_gen.get_span_id()  # 16-char hex (8 bytes)
         # Use 16-byte hex strings for object_id and root_span_id to see UUID conversion
         components = SpanComponentsV3(
             object_type=SpanObjectTypeV3.PROJECT_LOGS,
             object_id=trace_id,  # 16-byte hex should get converted to UUID format
-            row_id='test-row-id',
-            span_id=span_id,     # 8-byte hex might be preserved
-            root_span_id=trace_id  # 16-byte hex should get converted to UUID format
+            row_id="test-row-id",
+            span_id=span_id,  # 8-byte hex might be preserved
+            root_span_id=trace_id,  # 16-byte hex should get converted to UUID format
         )
         exported = components.to_str()
@@ -79,14 +78,14 @@ class TestSpanComponentsV4:
         """Test that V4 preserves OTEL hex strings exactly."""
         otel_gen = OTELIDGenerator()
         trace_id = otel_gen.get_trace_id()  # 32-char hex
-        span_id = otel_gen.get_span_id()    # 16-char hex
+        span_id = otel_gen.get_span_id()  # 16-char hex
         components = SpanComponentsV4(
             object_type=SpanObjectTypeV3.PROJECT_LOGS,
-            object_id='test-project-id',
-            row_id='test-row-id',
+            object_id="test-project-id",
+            row_id="test-row-id",
             span_id=span_id,
-            root_span_id=trace_id
+            root_span_id=trace_id,
         )
         exported = components.to_str()
@@ -108,9 +107,9 @@ class TestSpanComponentsV4:
         components = SpanComponentsV4(
             object_type=SpanObjectTypeV3.PROJECT_LOGS,
             object_id=uuid_object_id,
-            row_id='test-row-id',
+            row_id="test-row-id",
             span_id=uuid_span_id,
-            root_span_id=uuid_root_span_id
+            root_span_id=uuid_root_span_id,
         )
         exported = components.to_str()
@@ -133,9 +132,9 @@ class TestSpanComponentsV4:
         components = SpanComponentsV4(
             object_type=SpanObjectTypeV3.EXPERIMENT,
             object_id=uuid_object_id,
-            row_id='test-row-id',
+            row_id="test-row-id",
             span_id=hex_span_id,
-            root_span_id=hex_trace_id
+            root_span_id=hex_trace_id,
         )
         exported = components.to_str()
@@ -162,10 +161,10 @@ class TestSpanComponentsV4:
         # Create equivalent Python object
         py_components = SpanComponentsV4(
             object_type=SpanObjectTypeV3.EXPERIMENT,
-            object_id='js-test-experiment-id',
-            row_id='js-test-row-id',
-            span_id='abcdef1234567890',
-            root_span_id='fedcba0987654321fedcba0987654321'
+            object_id="js-test-experiment-id",
+            row_id="js-test-row-id",
+            span_id="abcdef1234567890",
+            root_span_id="fedcba0987654321fedcba0987654321",
         )
         # Python should generate the same slug
@@ -184,8 +183,8 @@ class TestSpanComponentsV4:
         """Test V4 with additional metadata."""
         components = SpanComponentsV4(
             object_type=SpanObjectTypeV3.PLAYGROUND_LOGS,
-            object_id='test-session-id',
-            propagated_event={"user": "test", "data": [1, 2, 3]}
+            object_id="test-session-id",
+            propagated_event={"user": "test", "data": [1, 2, 3]},
         )
         exported = components.to_str()
@@ -199,14 +198,14 @@ class TestSpanComponentsV4:
         """Test that non-UUID/hex strings are stored in JSON portion."""
         components = SpanComponentsV4(
             object_type=SpanObjectTypeV3.PROJECT_LOGS,
-            object_id='not-a-uuid-or-hex',  # Will be stored in JSON
+            object_id="not-a-uuid-or-hex",  # Will be stored in JSON
             # Don't test row_id alone - if present, span_id and root_span_id must also be present
         )
         exported = components.to_str()
         imported = SpanComponentsV4.from_str(exported)
-        assert imported.object_id == 'not-a-uuid-or-hex'
+        assert imported.object_id == "not-a-uuid-or-hex"
 class TestBackwardCompatibility:
@@ -221,7 +220,7 @@ class TestBackwardCompatibility:
             row_id=str(uuid4()),
             span_id=str(uuid4()),
             root_span_id=str(uuid4()),
-            propagated_event={"version": "v3"}
+            propagated_event={"version": "v3"},
         )
         # Serialize with V3
@@ -238,7 +237,6 @@ class TestBackwardCompatibility:
         assert v4_imported.propagated_event == v3_components.propagated_event
 class TestErrorHandling:
     """Test error handling and edge cases."""
@@ -247,7 +245,7 @@ class TestErrorHandling:
         with pytest.raises(AssertionError):
             SpanComponentsV4(
                 object_type="invalid_type",  # Should be SpanObjectTypeV3 enum
-                object_id="test-id"
+                object_id="test-id",
             )
     def test_missing_required_fields(self):
@@ -280,10 +278,7 @@ class TestErrorHandling:
         import base64
         # Create valid data then corrupt it
-        components = SpanComponentsV4(
-            object_type=SpanObjectTypeV3.PROJECT_LOGS,
-            object_id="test-id"
-        )
+        components = SpanComponentsV4(object_type=SpanObjectTypeV3.PROJECT_LOGS, object_id="test-id")
         valid_exported = components.to_str()
         # Decode, corrupt, re-encode
@@ -302,30 +297,21 @@ class TestObjectIdFields:
     def test_experiment_object_id_fields(self):
         """Test object_id_fields for experiment type."""
-        components = SpanComponentsV4(
-            object_type=SpanObjectTypeV3.EXPERIMENT,
-            object_id="test-experiment-id"
-        )
+        components = SpanComponentsV4(object_type=SpanObjectTypeV3.EXPERIMENT, object_id="test-experiment-id")
         fields = components.object_id_fields()
         assert fields == {"experiment_id": "test-experiment-id"}
     def test_project_logs_object_id_fields(self):
         """Test object_id_fields for project_logs type."""
-        components = SpanComponentsV4(
-            object_type=SpanObjectTypeV3.PROJECT_LOGS,
-            object_id="test-project-id"
-        )
+        components = SpanComponentsV4(object_type=SpanObjectTypeV3.PROJECT_LOGS, object_id="test-project-id")
         fields = components.object_id_fields()
         assert fields == {"project_id": "test-project-id", "log_id": "g"}
     def test_playground_logs_object_id_fields(self):
         """Test object_id_fields for playground_logs type."""
-        components = SpanComponentsV4(
-            object_type=SpanObjectTypeV3.PLAYGROUND_LOGS,
-            object_id="test-session-id"
-        )
+        components = SpanComponentsV4(object_type=SpanObjectTypeV3.PLAYGROUND_LOGS, object_id="test-session-id")
         fields = components.object_id_fields()
         assert fields == {"prompt_session_id": "test-session-id", "log_id": "x"}
@@ -333,8 +319,7 @@ class TestObjectIdFields:
     def test_object_id_fields_without_object_id(self):
         """Test that object_id_fields raises error without object_id."""
         components = SpanComponentsV4(
-            object_type=SpanObjectTypeV3.PROJECT_LOGS,
-            compute_object_metadata_args={"key": "value"}
+            object_type=SpanObjectTypeV3.PROJECT_LOGS, compute_object_metadata_args={"key": "value"}
         )
         with pytest.raises(Exception) as exc_info:

braintrust/util.py CHANGED Viewed

@@ -2,8 +2,9 @@ import inspect
 import sys
 import threading
 import urllib.parse
+from collections.abc import Callable, Mapping
 from dataclasses import dataclass
-from typing import Any, Callable, Dict, Generic, Literal, Mapping, Optional, Set, Tuple, TypedDict, TypeVar, Union
+from typing import Any, Generic, Literal, TypedDict, TypeVar, Union
 from requests import HTTPError, Response
@@ -29,8 +30,8 @@ def coalesce(*args):
 def merge_dicts_with_paths(
-    merge_into: Dict[str, Any], merge_from: Mapping[str, Any], path: Tuple[str, ...], merge_paths: Set[Tuple[str]]
-) -> Dict[str, Any]:
+    merge_into: dict[str, Any], merge_from: Mapping[str, Any], path: tuple[str, ...], merge_paths: set[tuple[str]]
+) -> dict[str, Any]:
     """Merges merge_from into merge_into, destructively updating merge_into. Does not merge any further than
     merge_paths."""
@@ -50,7 +51,7 @@ def merge_dicts_with_paths(
     return merge_into
-def merge_dicts(merge_into: Dict[str, Any], merge_from: Mapping[str, Any]) -> Dict[str, Any]:
+def merge_dicts(merge_into: dict[str, Any], merge_from: Mapping[str, Any]) -> dict[str, Any]:
     """Merges merge_from into merge_into, destructively updating merge_into."""
     return merge_dicts_with_paths(merge_into, merge_from, (), set())
@@ -92,7 +93,7 @@ class CallerLocation(TypedDict):
     caller_lineno: int
-def get_caller_location() -> Optional[CallerLocation]:
+def get_caller_location() -> CallerLocation | None:
     frame = inspect.currentframe()
     while frame:
         frame = frame.f_back
@@ -145,7 +146,7 @@ class LazyValue(Generic[T]):
         return self._state.has_succeeded
     @property
-    def value(self) -> Optional[T]:
+    def value(self) -> T | None:
         return self._state.value if self._state.has_succeeded == True else None
     def get(self) -> T:
@@ -167,7 +168,7 @@ class LazyValue(Generic[T]):
             if self.mutex:
                 self.mutex.release()
-    def get_sync(self) -> Tuple[bool, Optional[T]]:
+    def get_sync(self) -> tuple[bool, T | None]:
         """Returns a tuple of (has_succeeded, value) without triggering evaluation."""
         if self._state.has_succeeded:
             # should be fine without the mutex check
@@ -206,7 +207,7 @@ def bt_iscoroutinefunction(f):
     return inspect.iscoroutinefunction(f) or inspect.isasyncgenfunction(f) or getattr(f, BT_IS_ASYNC_ATTRIBUTE, False)
-def add_azure_blob_headers(headers: Dict[str, str], url: str) -> None:
+def add_azure_blob_headers(headers: dict[str, str], url: str) -> None:
     # According to https://stackoverflow.com/questions/37824136/put-on-sas-blob-url-without-specifying-x-ms-blob-type-header,
     # there is no way to avoid including this.
     if "blob.core.windows.net" in url:

braintrust/version.py CHANGED Viewed

@@ -1,4 +1,4 @@
-VERSION = "0.3.14"
+VERSION = "0.4.0"
 # this will be templated during the build
-GIT_COMMIT = "dbbc1894ef31143816e5913676301261bc44aa4c"
+GIT_COMMIT = "8ab13f3f48af6a4d3c0b053e4bbabfd4f24f23ec"

braintrust/wrappers/_anthropic_utils.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """Shared utilities for Anthropic API wrappers."""
-from typing import Any, Dict
+from typing import Any
 class Wrapper:
@@ -13,7 +13,7 @@ class Wrapper:
         return getattr(self.__wrapped, name)
-def extract_anthropic_usage(usage: Any) -> Dict[str, float]:
+def extract_anthropic_usage(usage: Any) -> dict[str, float]:
     """Extract and normalize usage metrics from Anthropic usage object or dict.
     Converts Anthropic's usage format to Braintrust's standard token metric names.
@@ -29,7 +29,7 @@ def extract_anthropic_usage(usage: Any) -> Dict[str, float]:
         - prompt_cached_tokens (from cache_read_input_tokens)
         - prompt_cache_creation_tokens (from cache_creation_input_tokens)
     """
-    metrics: Dict[str, float] = {}
+    metrics: dict[str, float] = {}
     if not usage:
         return metrics
@@ -73,7 +73,7 @@ def extract_anthropic_usage(usage: Any) -> Dict[str, float]:
     return metrics
-def finalize_anthropic_tokens(metrics: Dict[str, float]) -> Dict[str, float]:
+def finalize_anthropic_tokens(metrics: dict[str, float]) -> dict[str, float]:
     """Finalize Anthropic token calculations.
     Anthropic doesn't include cache tokens in the total, so we need to sum them.

braintrust/wrappers/agno/__init__.py CHANGED Viewed

@@ -21,7 +21,6 @@ Usage:
 __all__ = ["setup_agno", "wrap_agent", "wrap_function_call", "wrap_model", "wrap_team"]
 import logging
-from typing import Optional
 from braintrust.logger import NOOP_SPAN, current_span, init_logger
@@ -34,9 +33,9 @@ logger = logging.getLogger(__name__)
 def setup_agno(
-    api_key: Optional[str] = None,
-    project_id: Optional[str] = None,
-    project_name: Optional[str] = None,
+    api_key: str | None = None,
+    project_id: str | None = None,
+    project_name: str | None = None,
 ) -> bool:
     """
     Setup Braintrust integration with Agno. Will automatically patch Agno agents, models, and function calls for tracing.

braintrust/wrappers/agno/agent.py CHANGED Viewed

@@ -1,10 +1,9 @@
 import time
 from typing import Any
-from wrapt import wrap_function_wrapper
 from braintrust.logger import start_span
 from braintrust.span_types import SpanTypeAttribute
+from wrapt import wrap_function_wrapper
 from .utils import (
     _aggregate_agent_chunks,

braintrust/wrappers/agno/function_call.py CHANGED Viewed

@@ -1,9 +1,8 @@
 from typing import Any
-from wrapt import wrap_function_wrapper
 from braintrust.logger import start_span
 from braintrust.span_types import SpanTypeAttribute
+from wrapt import wrap_function_wrapper
 from .utils import is_patched

braintrust/wrappers/agno/model.py CHANGED Viewed

@@ -5,10 +5,9 @@ ModelWrapper class for Braintrust-Agno model observability.
 import time
 from typing import Any
-from wrapt import wrap_function_wrapper
 from braintrust.logger import start_span
 from braintrust.span_types import SpanTypeAttribute
+from wrapt import wrap_function_wrapper
 from .utils import (
     _aggregate_model_chunks,

braintrust/wrappers/agno/team.py CHANGED Viewed

@@ -1,10 +1,9 @@
 import time
 from typing import Any
-from wrapt import wrap_function_wrapper
 from braintrust.logger import start_span
 from braintrust.span_types import SpanTypeAttribute
+from wrapt import wrap_function_wrapper
 from .utils import (
     _aggregate_agent_chunks,

braintrust/wrappers/agno/utils.py CHANGED Viewed

@@ -1,8 +1,8 @@
 import time
-from typing import Any, Dict, List, Optional
+from typing import Any
-def omit(obj: Dict[str, Any], keys: List[str]):
+def omit(obj: dict[str, Any], keys: list[str]):
     return {k: v for k, v in obj.items() if k not in keys}
@@ -14,11 +14,11 @@ def mark_patched(obj: Any):
     setattr(obj, "_braintrust_patched", True)
-def clean(obj: Dict[str, Any]) -> Dict[str, Any]:
+def clean(obj: dict[str, Any]) -> dict[str, Any]:
     return {k: v for k, v in obj.items() if v is not None}
-def get_args_kwargs(args: List[str], kwargs: Dict[str, Any], keys: List[str]):
+def get_args_kwargs(args: list[str], kwargs: dict[str, Any], keys: list[str]):
     return {k: args[i] if args else kwargs.get(k) for i, k in enumerate(keys)}, omit(kwargs, keys)
@@ -71,7 +71,7 @@ AGNO_METRICS_MAP = {
 }
-def extract_metadata(instance: Any, component: str) -> Dict[str, Any]:
+def extract_metadata(instance: Any, component: str) -> dict[str, Any]:
     """Extract metadata from any component (model, agent, team)."""
     metadata = {"component": component}
@@ -100,7 +100,7 @@ def extract_metadata(instance: Any, component: str) -> Dict[str, Any]:
     return metadata
-def parse_metrics_from_agno(usage: Any) -> Dict[str, Any]:
+def parse_metrics_from_agno(usage: Any) -> dict[str, Any]:
     """Parse metrics from Agno usage object, following OpenAI wrapper pattern."""
     metrics = {}
@@ -121,7 +121,7 @@ def parse_metrics_from_agno(usage: Any) -> Dict[str, Any]:
     return metrics
-def extract_metrics(result: Any, messages: Optional[list] = None) -> Dict[str, Any]:
+def extract_metrics(result: Any, messages: list | None = None) -> dict[str, Any]:
     """
     Unified metrics extraction for all components.
@@ -163,7 +163,7 @@ def extract_metrics(result: Any, messages: Optional[list] = None) -> Dict[str, A
     return {}
-def extract_streaming_metrics(aggregated: Dict[str, Any], start_time: float) -> Optional[Dict[str, Any]]:
+def extract_streaming_metrics(aggregated: dict[str, Any], start_time: float) -> dict[str, Any] | None:
     """Extract metrics from aggregated streaming response."""
     metrics = {}
@@ -187,7 +187,7 @@ def extract_streaming_metrics(aggregated: Dict[str, Any], start_time: float) ->
     return metrics if metrics else None
-def _aggregate_metrics(target: Dict[str, Any], source: Dict[str, Any]) -> None:
+def _aggregate_metrics(target: dict[str, Any], source: dict[str, Any]) -> None:
     """Aggregate metrics from source into target dict."""
     for key, value in source.items():
         if _is_numeric(value):
@@ -205,7 +205,7 @@ def _aggregate_metrics(target: Dict[str, Any], source: Dict[str, Any]) -> None:
                 target[key] = value
-def _aggregate_model_chunks(chunks: List[Any]) -> Dict[str, Any]:
+def _aggregate_model_chunks(chunks: list[Any]) -> dict[str, Any]:
     """Aggregate ModelResponse chunks from invoke_stream into a complete response."""
     aggregated = {
         "content": "",
@@ -263,7 +263,7 @@ def _aggregate_model_chunks(chunks: List[Any]) -> Dict[str, Any]:
     return aggregated
-def _aggregate_response_stream_chunks(chunks: List[Any]) -> Dict[str, Any]:
+def _aggregate_response_stream_chunks(chunks: list[Any]) -> dict[str, Any]:
     """
     Aggregate chunks from response_stream which can be ModelResponse, RunOutputEvent, or TeamRunOutputEvent.
@@ -344,7 +344,7 @@ def _aggregate_response_stream_chunks(chunks: List[Any]) -> Dict[str, Any]:
     return aggregated
-def _aggregate_agent_chunks(chunks: List[Any]) -> Dict[str, Any]:
+def _aggregate_agent_chunks(chunks: list[Any]) -> dict[str, Any]:
     """Aggregate BaseAgentRunEvent/BaseTeamRunEvent chunks into a complete response."""
     aggregated = {
         "content": "",

braintrust/wrappers/anthropic.py CHANGED Viewed

@@ -2,7 +2,6 @@ import logging
 import time
 import warnings
 from contextlib import contextmanager
-from typing import Optional
 from braintrust.logger import NOOP_SPAN, log_exc_info_to_span, start_span
 from braintrust.wrappers._anthropic_utils import Wrapper, extract_anthropic_usage, finalize_anthropic_tokens
@@ -10,7 +9,6 @@ from braintrust.wrappers._anthropic_utils import Wrapper, extract_anthropic_usag
 log = logging.getLogger(__name__)
 # This tracer depends on an internal anthropic method used to merge
 # streamed messages together. It's a bit tricky so I'm opting to use it
 # here. If it goes away, this polyfill will make it a no-op and the only
@@ -242,7 +240,7 @@ class TracedMessageStream(Wrapper):
         self.__metrics = {}
         self.__snapshot = None
         self.__request_start_time = request_start_time
-        self.__time_to_first_token: Optional[float] = None
+        self.__time_to_first_token: float | None = None
     def _get_final_traced_message(self):
         return self.__snapshot
@@ -314,7 +312,7 @@ def _start_span(name, kwargs):
     return NOOP_SPAN
-def _log_message_to_span(message, span, time_to_first_token: Optional[float] = None):
+def _log_message_to_span(message, span, time_to_first_token: float | None = None):
     """Log telemetry from the given anthropic.Message to the given span."""
     with _catch_exceptions():
         usage = getattr(message, "usage", {})
@@ -326,13 +324,14 @@ def _log_message_to_span(message, span, time_to_first_token: Optional[float] = N
         # Create output dict with only truthy values for role and content
         output = {
-            k: v for k, v in {
-                "role": getattr(message, "role", None),
-                "content": getattr(message, "content", None)
-            }.items() if v
+            k: v
+            for k, v in {"role": getattr(message, "role", None), "content": getattr(message, "content", None)}.items()
+            if v
         } or None
         span.log(output=output, metrics=metrics)
 @contextmanager
 def _catch_exceptions():
     try:

braintrust/wrappers/claude_agent_sdk/__init__.py CHANGED Viewed

@@ -16,7 +16,6 @@ Usage (imports can be before or after setup):
 """
 import logging
-from typing import Optional
 from braintrust.logger import NOOP_SPAN, current_span, init_logger
@@ -28,9 +27,9 @@ __all__ = ["setup_claude_agent_sdk"]
 def setup_claude_agent_sdk(
-    api_key: Optional[str] = None,
-    project_id: Optional[str] = None,
-    project: Optional[str] = None,
+    api_key: str | None = None,
+    project_id: str | None = None,
+    project: str | None = None,
 ) -> bool:
     """
     Setup Braintrust integration with Claude Agent SDK. Will automatically patch the SDK for automatic tracing.

braintrust 0.3.14__py3-none-any.whl → 0.4.0__py3-none-any.whl

braintrust 0.3.14__py3-none-any.whl → 0.4.0__py3-none-any.whl