PyPI - nvidia-nat - Versions diffs - 1.3.0a20250910__py3-none-any.whl → 1.4.0a20251112__py3-none-any.whl - Mend

nvidia-nat 1.3.0a20250910__py3-none-any.whl → 1.4.0a20251112__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (213)

nat/agent/base.py +13 -8
nat/agent/prompt_optimizer/prompt.py +68 -0
nat/agent/prompt_optimizer/register.py +149 -0
nat/agent/react_agent/agent.py +6 -5
nat/agent/react_agent/register.py +49 -39
nat/agent/reasoning_agent/reasoning_agent.py +17 -15
nat/agent/register.py +2 -0
nat/agent/responses_api_agent/__init__.py +14 -0
nat/agent/responses_api_agent/register.py +126 -0
nat/agent/rewoo_agent/agent.py +304 -117
nat/agent/rewoo_agent/prompt.py +19 -22
nat/agent/rewoo_agent/register.py +51 -38
nat/agent/tool_calling_agent/agent.py +75 -17
nat/agent/tool_calling_agent/register.py +46 -23
nat/authentication/api_key/api_key_auth_provider.py +6 -11
nat/authentication/api_key/api_key_auth_provider_config.py +8 -5
nat/authentication/credential_validator/__init__.py +14 -0
nat/authentication/credential_validator/bearer_token_validator.py +557 -0
nat/authentication/http_basic_auth/http_basic_auth_provider.py +1 -1
nat/authentication/interfaces.py +5 -2
nat/authentication/oauth2/oauth2_auth_code_flow_provider.py +69 -36
nat/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +2 -1
nat/authentication/oauth2/oauth2_resource_server_config.py +125 -0
nat/builder/builder.py +55 -23
nat/builder/component_utils.py +9 -5
nat/builder/context.py +54 -15
nat/builder/eval_builder.py +14 -9
nat/builder/framework_enum.py +1 -0
nat/builder/front_end.py +1 -1
nat/builder/function.py +370 -0
nat/builder/function_info.py +1 -1
nat/builder/intermediate_step_manager.py +38 -2
nat/builder/workflow.py +5 -0
nat/builder/workflow_builder.py +306 -54
nat/cli/cli_utils/config_override.py +1 -1
nat/cli/commands/info/info.py +16 -6
nat/cli/commands/mcp/__init__.py +14 -0
nat/cli/commands/mcp/mcp.py +986 -0
nat/cli/commands/optimize.py +90 -0
nat/cli/commands/start.py +1 -1
nat/cli/commands/workflow/templates/config.yml.j2 +14 -13
nat/cli/commands/workflow/templates/register.py.j2 +2 -2
nat/cli/commands/workflow/templates/workflow.py.j2 +35 -21
nat/cli/commands/workflow/workflow_commands.py +60 -18
nat/cli/entrypoint.py +15 -11
nat/cli/main.py +3 -0
nat/cli/register_workflow.py +38 -4
nat/cli/type_registry.py +72 -1
nat/control_flow/__init__.py +0 -0
nat/control_flow/register.py +20 -0
nat/control_flow/router_agent/__init__.py +0 -0
nat/control_flow/router_agent/agent.py +329 -0
nat/control_flow/router_agent/prompt.py +48 -0
nat/control_flow/router_agent/register.py +91 -0
nat/control_flow/sequential_executor.py +166 -0
nat/data_models/agent.py +34 -0
nat/data_models/api_server.py +199 -69
nat/data_models/authentication.py +23 -9
nat/data_models/common.py +47 -0
nat/data_models/component.py +2 -0
nat/data_models/component_ref.py +11 -0
nat/data_models/config.py +41 -17
nat/data_models/dataset_handler.py +4 -3
nat/data_models/function.py +34 -0
nat/data_models/function_dependencies.py +8 -0
nat/data_models/intermediate_step.py +9 -1
nat/data_models/llm.py +15 -1
nat/data_models/openai_mcp.py +46 -0
nat/data_models/optimizable.py +208 -0
nat/data_models/optimizer.py +161 -0
nat/data_models/span.py +41 -3
nat/data_models/thinking_mixin.py +2 -2
nat/embedder/azure_openai_embedder.py +2 -1
nat/embedder/nim_embedder.py +3 -2
nat/embedder/openai_embedder.py +3 -2
nat/eval/config.py +1 -1
nat/eval/dataset_handler/dataset_downloader.py +3 -2
nat/eval/dataset_handler/dataset_filter.py +34 -2
nat/eval/evaluate.py +10 -3
nat/eval/evaluator/base_evaluator.py +1 -1
nat/eval/rag_evaluator/evaluate.py +7 -4
nat/eval/register.py +4 -0
nat/eval/runtime_evaluator/__init__.py +14 -0
nat/eval/runtime_evaluator/evaluate.py +123 -0
nat/eval/runtime_evaluator/register.py +100 -0
nat/eval/swe_bench_evaluator/evaluate.py +1 -1
nat/eval/trajectory_evaluator/register.py +1 -1
nat/eval/tunable_rag_evaluator/evaluate.py +1 -1
nat/eval/usage_stats.py +2 -0
nat/eval/utils/output_uploader.py +3 -2
nat/eval/utils/weave_eval.py +17 -3
nat/experimental/decorators/experimental_warning_decorator.py +27 -7
nat/experimental/test_time_compute/functions/execute_score_select_function.py +1 -1
nat/experimental/test_time_compute/functions/plan_select_execute_function.py +7 -3
nat/experimental/test_time_compute/functions/ttc_tool_orchestration_function.py +1 -1
nat/experimental/test_time_compute/functions/ttc_tool_wrapper_function.py +3 -3
nat/experimental/test_time_compute/models/strategy_base.py +2 -2
nat/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +1 -1
nat/front_ends/console/authentication_flow_handler.py +82 -30
nat/front_ends/console/console_front_end_plugin.py +19 -7
nat/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +1 -1
nat/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +52 -17
nat/front_ends/fastapi/dask_client_mixin.py +65 -0
nat/front_ends/fastapi/fastapi_front_end_config.py +25 -3
nat/front_ends/fastapi/fastapi_front_end_plugin.py +140 -3
nat/front_ends/fastapi/fastapi_front_end_plugin_worker.py +445 -265
nat/front_ends/fastapi/job_store.py +518 -99
nat/front_ends/fastapi/main.py +11 -19
nat/front_ends/fastapi/message_handler.py +69 -44
nat/front_ends/fastapi/message_validator.py +8 -7
nat/front_ends/fastapi/utils.py +57 -0
nat/front_ends/mcp/introspection_token_verifier.py +73 -0
nat/front_ends/mcp/mcp_front_end_config.py +71 -3
nat/front_ends/mcp/mcp_front_end_plugin.py +85 -21
nat/front_ends/mcp/mcp_front_end_plugin_worker.py +248 -29
nat/front_ends/mcp/memory_profiler.py +320 -0
nat/front_ends/mcp/tool_converter.py +78 -25
nat/front_ends/simple_base/simple_front_end_plugin_base.py +3 -1
nat/llm/aws_bedrock_llm.py +21 -8
nat/llm/azure_openai_llm.py +14 -5
nat/llm/litellm_llm.py +80 -0
nat/llm/nim_llm.py +23 -9
nat/llm/openai_llm.py +19 -7
nat/llm/register.py +4 -0
nat/llm/utils/thinking.py +1 -1
nat/observability/exporter/base_exporter.py +1 -1
nat/observability/exporter/processing_exporter.py +29 -55
nat/observability/exporter/span_exporter.py +43 -15
nat/observability/exporter_manager.py +2 -2
nat/observability/mixin/redaction_config_mixin.py +5 -4
nat/observability/mixin/tagging_config_mixin.py +26 -14
nat/observability/mixin/type_introspection_mixin.py +420 -107
nat/observability/processor/batching_processor.py +1 -1
nat/observability/processor/processor.py +3 -0
nat/observability/processor/redaction/__init__.py +24 -0
nat/observability/processor/redaction/contextual_redaction_processor.py +125 -0
nat/observability/processor/redaction/contextual_span_redaction_processor.py +66 -0
nat/observability/processor/redaction/redaction_processor.py +177 -0
nat/observability/processor/redaction/span_header_redaction_processor.py +92 -0
nat/observability/processor/span_tagging_processor.py +21 -14
nat/observability/register.py +16 -0
nat/profiler/callbacks/langchain_callback_handler.py +32 -7
nat/profiler/callbacks/llama_index_callback_handler.py +36 -2
nat/profiler/callbacks/token_usage_base_model.py +2 -0
nat/profiler/decorators/framework_wrapper.py +61 -9
nat/profiler/decorators/function_tracking.py +35 -3
nat/profiler/forecasting/models/linear_model.py +1 -1
nat/profiler/forecasting/models/random_forest_regressor.py +1 -1
nat/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +1 -1
nat/profiler/inference_optimization/experimental/prefix_span_analysis.py +1 -1
nat/profiler/parameter_optimization/__init__.py +0 -0
nat/profiler/parameter_optimization/optimizable_utils.py +93 -0
nat/profiler/parameter_optimization/optimizer_runtime.py +67 -0
nat/profiler/parameter_optimization/parameter_optimizer.py +189 -0
nat/profiler/parameter_optimization/parameter_selection.py +107 -0
nat/profiler/parameter_optimization/pareto_visualizer.py +460 -0
nat/profiler/parameter_optimization/prompt_optimizer.py +384 -0
nat/profiler/parameter_optimization/update_helpers.py +66 -0
nat/profiler/utils.py +3 -1
nat/registry_handlers/pypi/register_pypi.py +5 -3
nat/registry_handlers/rest/register_rest.py +5 -3
nat/retriever/milvus/retriever.py +1 -1
nat/retriever/nemo_retriever/register.py +2 -1
nat/runtime/loader.py +1 -1
nat/runtime/runner.py +111 -6
nat/runtime/session.py +49 -3
nat/settings/global_settings.py +2 -2
nat/tool/chat_completion.py +4 -1
nat/tool/code_execution/code_sandbox.py +3 -6
nat/tool/code_execution/local_sandbox/Dockerfile.sandbox +19 -32
nat/tool/code_execution/local_sandbox/local_sandbox_server.py +6 -1
nat/tool/code_execution/local_sandbox/sandbox.requirements.txt +2 -0
nat/tool/code_execution/local_sandbox/start_local_sandbox.sh +10 -4
nat/tool/datetime_tools.py +1 -1
nat/tool/github_tools.py +450 -0
nat/tool/memory_tools/add_memory_tool.py +3 -3
nat/tool/memory_tools/delete_memory_tool.py +3 -4
nat/tool/memory_tools/get_memory_tool.py +4 -4
nat/tool/register.py +2 -7
nat/tool/server_tools.py +15 -2
nat/utils/__init__.py +76 -0
nat/utils/callable_utils.py +70 -0
nat/utils/data_models/schema_validator.py +1 -1
nat/utils/decorators.py +210 -0
nat/utils/exception_handlers/automatic_retries.py +278 -72
nat/utils/io/yaml_tools.py +73 -3
nat/utils/log_levels.py +25 -0
nat/utils/responses_api.py +26 -0
nat/utils/string_utils.py +16 -0
nat/utils/type_converter.py +12 -3
nat/utils/type_utils.py +6 -2
nvidia_nat-1.4.0a20251112.dist-info/METADATA +197 -0
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/RECORD +199 -165
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/entry_points.txt +1 -0
nat/cli/commands/info/list_mcp.py +0 -461
nat/data_models/temperature_mixin.py +0 -43
nat/data_models/top_p_mixin.py +0 -43
nat/observability/processor/header_redaction_processor.py +0 -123
nat/observability/processor/redaction_processor.py +0 -77
nat/tool/code_execution/test_code_execution_sandbox.py +0 -414
nat/tool/github_tools/create_github_commit.py +0 -133
nat/tool/github_tools/create_github_issue.py +0 -87
nat/tool/github_tools/create_github_pr.py +0 -106
nat/tool/github_tools/get_github_file.py +0 -106
nat/tool/github_tools/get_github_issue.py +0 -166
nat/tool/github_tools/get_github_pr.py +0 -256
nat/tool/github_tools/update_github_issue.py +0 -100
nvidia_nat-1.3.0a20250910.dist-info/METADATA +0 -373
/nat/{tool/github_tools → agent/prompt_optimizer}/__init__.py +0 -0
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/WHEEL +0 -0
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/licenses/LICENSE-3rd-party.txt +0 -0
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/licenses/LICENSE.md +0 -0
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/top_level.txt +0 -0

nat/observability/processor/redaction/contextual_redaction_processor.py ADDED Viewed

@@ -0,0 +1,125 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import logging
+from abc import abstractmethod
+from collections.abc import Callable
+from typing import Any
+from typing import TypeVar
+from nat.observability.processor.redaction.redaction_processor import RedactionContext
+from nat.observability.processor.redaction.redaction_processor import RedactionContextState
+from nat.observability.processor.redaction.redaction_processor import RedactionInputT
+from nat.observability.processor.redaction.redaction_processor import RedactionProcessor
+from nat.utils.type_utils import override
+logger = logging.getLogger(__name__)
+# Type variable for the data type extracted from context
+RedactionDataT = TypeVar('RedactionDataT')
+class ContextualRedactionProcessor(RedactionProcessor[RedactionInputT, RedactionDataT]):
+    """Generic processor with context-aware caching for any data type.
+    Provides a framework for redaction processors that need to:
+    - Extract data from the request context (headers, cookies, query params, etc.)
+    - Execute callbacks to determine redaction decisions
+    - Cache results within the request context to avoid redundant callback executions
+    - Handle race conditions with atomic operations
+    This class handles all the generic caching, context management, and callback
+    execution logic. Subclasses only need to implement data extraction and validation.
+    Args:
+        callback: Callable that determines if redaction should occur based on extracted data
+        enabled: Whether the processor is enabled
+        force_redact: If True, always redact regardless of data checks
+        redaction_value: The value to replace redacted attributes with
+    """
+    def __init__(
+        self,
+        callback: Callable[..., Any],
+        enabled: bool,
+        force_redact: bool,
+        redaction_value: str,
+    ):
+        self.callback = callback
+        self.enabled = enabled
+        self.force_redact = force_redact
+        self.redaction_value = redaction_value
+        self._redaction_context = RedactionContext(RedactionContextState())
+    @abstractmethod
+    def extract_data_from_context(self) -> RedactionDataT | None:
+        """Extract the relevant data from the context for redaction decision.
+        This method must be implemented by subclasses to extract their specific
+        data type (headers, cookies, query params, etc.) from the request context
+        Returns:
+            RedactionDataT | None: The extracted data, or None if no relevant data found
+        """
+        pass
+    @abstractmethod
+    def validate_data(self, data: RedactionDataT) -> bool:
+        """Validate that the extracted data is suitable for callback execution.
+        This method allows subclasses to implement their own validation logic
+        (e.g., checking if headers exist, if cookies are not empty, etc.).
+        Args:
+            data (RedactionDataT): The extracted data to validate
+        Returns:
+            bool: True if the data is valid for callback execution, False otherwise
+        """
+        pass
+    @override
+    async def should_redact(self, item: RedactionInputT) -> bool:
+        """Determine if this span should be redacted based on extracted data.
+        Extracts the relevant data from the context, validates it, and passes it to the
+        callback function to determine if redaction should occur. Results are cached
+        within the request context to avoid redundant callback executions.
+        Args:
+            item (RedactionInputT): The item to check
+        Returns:
+            bool: True if the span should be redacted, False otherwise
+        """
+        # If force_redact is enabled, always redact regardless of other conditions
+        if self.force_redact:
+            return True
+        if not self.enabled:
+            return False
+        # Extract data using subclass implementation
+        data = self.extract_data_from_context()
+        if data is None:
+            return False
+        # Validate data using subclass implementation
+        if not self.validate_data(data):
+            return False
+        # Use the generic caching framework for callback execution
+        async with self._redaction_context.redaction_manager() as manager:
+            return await manager.redaction_check(self.callback, data)

nat/observability/processor/redaction/contextual_span_redaction_processor.py ADDED Viewed

@@ -0,0 +1,66 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from collections.abc import Callable
+from typing import Any
+from nat.data_models.span import Span
+from nat.observability.processor.redaction.contextual_redaction_processor import ContextualRedactionProcessor
+from nat.observability.processor.redaction.redaction_processor import RedactionDataT
+from nat.utils.type_utils import override
+class ContextualSpanRedactionProcessor(ContextualRedactionProcessor[Span, RedactionDataT]):
+    """Processor that redacts the Span based on the Span attributes.
+    Args:
+        attributes: List of span attribute keys to redact
+        callback: Callable that determines if redaction should occur
+        enabled: Whether the processor is enabled
+        force_redact: If True, always redact regardless of callback
+        redaction_value: The value to replace redacted attributes with
+    """
+    def __init__(self,
+                 attributes: list[str],
+                 callback: Callable[..., Any],
+                 enabled: bool,
+                 force_redact: bool,
+                 redaction_value: str,
+                 redaction_tag: str | None = None):
+        super().__init__(callback=callback, enabled=enabled, force_redact=force_redact, redaction_value=redaction_value)
+        self.attributes = attributes
+        self.redaction_tag = redaction_tag
+    @override
+    async def redact_item(self, item: Span) -> Span:
+        """Redact specified attributes in the span.
+        Replaces the values of configured attributes with the redaction value.
+        Args:
+            item (Span): The span to redact
+        Returns:
+            Span: The span with redacted attributes
+        """
+        for key in self.attributes:
+            if key in item.attributes:
+                item.set_attribute(key, self.redaction_value)
+        if self.redaction_tag:
+            item.set_attribute(self.redaction_tag, True)
+        return item

nat/observability/processor/redaction/redaction_processor.py ADDED Viewed

@@ -0,0 +1,177 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import logging
+from abc import abstractmethod
+from collections.abc import AsyncGenerator
+from collections.abc import Callable
+from contextlib import asynccontextmanager
+from contextvars import ContextVar
+from dataclasses import dataclass
+from dataclasses import field
+from typing import Any
+from typing import Generic
+from typing import TypeVar
+from nat.observability.processor.processor import Processor
+from nat.utils.callable_utils import ainvoke_any
+from nat.utils.type_utils import override
+RedactionInputT = TypeVar('RedactionInputT')
+RedactionDataT = TypeVar('RedactionDataT')
+logger = logging.getLogger(__name__)
+class RedactionProcessor(Processor[RedactionInputT, RedactionInputT], Generic[RedactionInputT, RedactionDataT]):
+    """Abstract base class for redaction processors."""
+    @abstractmethod
+    async def should_redact(self, item: RedactionInputT) -> bool:
+        """Determine if this item should be redacted.
+        Args:
+            item (RedactionInputT): The item to check.
+        Returns:
+            bool: True if the item should be redacted, False otherwise.
+        """
+        pass
+    @abstractmethod
+    async def redact_item(self, item: RedactionInputT) -> RedactionInputT:
+        """Redact the item.
+        Args:
+            item (RedactionInputT): The item to redact.
+        Returns:
+            RedactionInputT: The redacted item.
+        """
+        pass
+    @override
+    async def process(self, item: RedactionInputT) -> RedactionInputT:
+        """Perform redaction on the item if it should be redacted.
+        Args:
+            item (RedactionInputT): The item to process.
+        Returns:
+            RedactionInputT: The processed item.
+        """
+        if await self.should_redact(item):
+            return await self.redact_item(item)
+        return item
+@dataclass
+class RedactionContextState:
+    """Generic context state for redaction results.
+    Stores the redaction result in a context variable to avoid redundant
+    callback executions within the same request context.
+    """
+    redaction_result: ContextVar[bool
+                                 | None] = field(default_factory=lambda: ContextVar("redaction_result", default=None))
+class RedactionManager(Generic[RedactionDataT]):
+    """Generic manager for atomic redaction operations.
+    Handles state mutations and ensures atomic callback execution
+    with proper result caching within a request context.
+    Args:
+        RedactionDataT: The type of data being processed for redaction decisions.
+    """
+    def __init__(self, context_state: RedactionContextState):
+        self._context_state = context_state
+    def set_redaction_result(self, result: bool) -> None:
+        """Set the redaction result in the context.
+        Args:
+            result (bool): The redaction result to cache.
+        """
+        self._context_state.redaction_result.set(result)
+    def clear_redaction_result(self) -> None:
+        """Clear the cached redaction result from the context."""
+        self._context_state.redaction_result.set(None)
+    async def redaction_check(self, callback: Callable[..., Any], data: RedactionDataT) -> bool:
+        """Execute redaction callback with atomic result caching.
+        Checks for existing cached results first, then executes the callback
+        and caches the result atomically. Since data is static per request,
+        subsequent calls within the same context return the cached result.
+        Supports sync/async functions, generators, and async generators.
+        Args:
+            callback (Callable[..., Any]): The callback to execute (sync/async function, generator, etc.).
+            data (RedactionDataT): The data to pass to the callback for redaction decision.
+        Returns:
+            bool: True if the item should be redacted, False otherwise.
+        """
+        # Check if we already have a result for this context
+        existing_result = self._context_state.redaction_result.get()
+        if existing_result is not None:
+            return existing_result
+        # Execute callback and cache result
+        result_value = await ainvoke_any(callback, data)
+        result = bool(result_value)
+        self.set_redaction_result(result)
+        return result
+class RedactionContext(Generic[RedactionDataT]):
+    """Generic context provider for redaction operations.
+    Provides read-only access to redaction state and manages the
+    RedactionManager lifecycle through async context managers.
+    Args:
+        RedactionDataT: The type of data being processed for redaction decisions.
+    """
+    def __init__(self, context: RedactionContextState):
+        self._context_state: RedactionContextState = context
+    @property
+    def redaction_result(self) -> bool | None:
+        """Get the current redaction result from context.
+        Returns:
+            bool | None: The cached redaction result, or None if not set.
+        """
+        return self._context_state.redaction_result.get()
+    @asynccontextmanager
+    async def redaction_manager(self) -> AsyncGenerator[RedactionManager[RedactionDataT], None]:
+        """Provide a redaction manager within an async context.
+        Creates and yields a RedactionManager instance for atomic
+        redaction operations within the current context.
+        Yields:
+            RedactionManager[RedactionDataT]: Manager instance for redaction operations.
+        """
+        yield RedactionManager(self._context_state)

nat/observability/processor/redaction/span_header_redaction_processor.py ADDED Viewed

@@ -0,0 +1,92 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import logging
+from collections.abc import Callable
+from typing import Any
+from starlette.datastructures import Headers
+from nat.builder.context import Context
+from nat.observability.processor.redaction.contextual_span_redaction_processor import ContextualSpanRedactionProcessor
+from nat.utils.type_utils import override
+logger = logging.getLogger(__name__)
+class SpanHeaderRedactionProcessor(ContextualSpanRedactionProcessor[dict[str, Any]]):
+    """Processor that redacts the Span based on multiple headers and callback logic.
+    Uses context-scoped atomic updates to avoid redundant callback executions within a single context.
+    Since headers are static per request, the callback result is cached for the entire context using
+    an asynccontextmanager to ensure atomic operations.
+    Args:
+        headers: List of header keys to extract and pass to the callback
+        attributes: List of Span attribute keys to redact
+        callback: Callable that determines if redaction should occur
+        enabled: Whether the processor is enabled (default: True)
+        force_redact: If True, always redact regardless of header checks (default: False)
+        redaction_value: The value to replace redacted attributes with (default: "[REDACTED]")
+    """
+    def __init__(self,
+                 headers: list[str],
+                 attributes: list[str],
+                 callback: Callable[..., Any],
+                 enabled: bool = True,
+                 force_redact: bool = False,
+                 redaction_value: str = "[REDACTED]",
+                 redaction_tag: str | None = None):
+        # Initialize the base class with common parameters
+        super().__init__(attributes=attributes,
+                         callback=callback,
+                         enabled=enabled,
+                         force_redact=force_redact,
+                         redaction_value=redaction_value,
+                         redaction_tag=redaction_tag)
+        # Store header-specific configuration
+        self.headers = headers
+    @override
+    def extract_data_from_context(self) -> dict[str, Any] | None:
+        """Extract header data from the context.
+        Returns:
+            dict[str, Any] | None: Dictionary of header names to values, or None if no headers.
+        """
+        context = Context.get()
+        headers: Headers | None = context.metadata.headers
+        if headers is None or not self.headers:
+            return None
+        header_map: dict[str, Any] = {header: headers.get(header, None) for header in self.headers}
+        return header_map
+    @override
+    def validate_data(self, data: dict[str, Any]) -> bool:
+        """Validate that the extracted headers are suitable for callback execution.
+        Args:
+            data (dict[str, Any]): The extracted header dictionary.
+        Returns:
+            bool: True if headers exist and are not all None, False otherwise.
+        """
+        # Skip callback if no headers were found (all None values)
+        return bool(data) and not all(value is None for value in data.values())

nat/observability/processor/span_tagging_processor.py CHANGED Viewed

@@ -15,6 +15,8 @@
 import logging
 import os
+from collections.abc import Mapping
+from enum import Enum
 from nat.data_models.span import Span
 from nat.observability.processor.processor import Processor
@@ -24,22 +26,20 @@ logger = logging.getLogger(__name__)
 class SpanTaggingProcessor(Processor[Span, Span]):
-    """Processor that tags spans with key-value metadata attributes.
+    """Processor that tags spans with multiple key-value metadata attributes.
     This processor adds custom tags to spans by setting attributes with a configurable prefix.
-    Tags are only applied when both tag_key and tag_value are provided. The processor uses
+    Tags are applied for each key-value pair in the tags dictionary. The processor uses
     a span prefix (configurable via NAT_SPAN_PREFIX environment variable) to namespace
     the tag attributes.
-    Args:
-        tag_key: The key name for the tag to add to spans.
-        tag_value: The value for the tag to add to spans.
-        span_prefix: The prefix to use for tag attributes (default: from NAT_SPAN_PREFIX env var or "nat").
+        Args:
+            tags: Mapping of tag keys to their values. Values can be enums (converted to strings) or strings
+            span_prefix: The prefix to use for tag attributes (default: from NAT_SPAN_PREFIX env var or "nat")
     """
-    def __init__(self, tag_key: str | None = None, tag_value: str | None = None, span_prefix: str | None = None):
-        self.tag_key = tag_key
-        self.tag_value = tag_value
+    def __init__(self, tags: Mapping[str, Enum | str] | None = None, span_prefix: str | None = None):
+        self.tags = tags or {}
         if span_prefix is None:
             span_prefix = os.getenv("NAT_SPAN_PREFIX", "nat").strip() or "nat"
@@ -48,14 +48,21 @@ class SpanTaggingProcessor(Processor[Span, Span]):
     @override
     async def process(self, item: Span) -> Span:
-        """Tag the span with a tag if both tag_key and tag_value are provided.
+        """Tag the span with all configured tags.
         Args:
-            item (Span): The span to tag.
+            item (Span): The span to tag
         Returns:
-            Span: The tagged span.
+            Span: The tagged span with all configured tags applied
         """
-        if self.tag_key and self.tag_value:
-            item.set_attribute(f"{self._span_prefix}.{self.tag_key}", self.tag_value)
+        for tag_key, tag_value in self.tags.items():
+            key = str(tag_key).strip()
+            if not key:
+                continue
+            value_str = str(tag_value.value) if isinstance(tag_value, Enum) else str(tag_value)
+            if value_str == "":
+                continue
+            item.set_attribute(f"{self._span_prefix}.{key}", value_str)
         return item

nat/observability/register.py CHANGED Viewed

@@ -77,6 +77,14 @@ async def console_logging_method(config: ConsoleLoggingMethodConfig, builder: Bu
     level = getattr(logging, config.level.upper(), logging.INFO)
     handler = logging.StreamHandler(stream=sys.stdout)
     handler.setLevel(level)
+    # Set formatter to match the default CLI format
+    formatter = logging.Formatter(
+        fmt="%(asctime)s - %(levelname)-8s - %(name)s:%(lineno)d - %(message)s",
+        datefmt="%Y-%m-%d %H:%M:%S",
+    )
+    handler.setFormatter(formatter)
     yield handler
@@ -95,4 +103,12 @@ async def file_logging_method(config: FileLoggingMethod, builder: Builder):
     level = getattr(logging, config.level.upper(), logging.INFO)
     handler = logging.FileHandler(filename=config.path, mode="a", encoding="utf-8")
     handler.setLevel(level)
+    # Set formatter to match the default CLI format
+    formatter = logging.Formatter(
+        fmt="%(asctime)s - %(levelname)-8s - %(name)s:%(lineno)d - %(message)s",
+        datefmt="%Y-%m-%d %H:%M:%S",
+    )
+    handler.setFormatter(formatter)
     yield handler

nat/profiler/callbacks/langchain_callback_handler.py CHANGED Viewed

@@ -33,6 +33,7 @@ from nat.builder.context import Context
 from nat.builder.framework_enum import LLMFrameworkEnum
 from nat.data_models.intermediate_step import IntermediateStepPayload
 from nat.data_models.intermediate_step import IntermediateStepType
+from nat.data_models.intermediate_step import ServerToolUseSchema
 from nat.data_models.intermediate_step import StreamEventData
 from nat.data_models.intermediate_step import ToolSchema
 from nat.data_models.intermediate_step import TraceMetadata
@@ -48,7 +49,14 @@ def _extract_tools_schema(invocation_params: dict) -> list:
     tools_schema = []
     if invocation_params is not None:
         for tool in invocation_params.get("tools", []):
-            tools_schema.append(ToolSchema(**tool))
+            try:
+                tools_schema.append(ToolSchema(**tool))
+            except Exception:
+                logger.debug(
+                    "Failed to parse tool schema from invocation params: %s. \n This "
+                    "can occur when the LLM server has native tools and can be ignored if "
+                    "using the responses API.",
+                    tool)
     return tools_schema
@@ -93,11 +101,15 @@ class LangchainProfilerHandler(AsyncCallbackHandler, BaseProfilerCallback):
             completion_tokens = usage_metadata.get("output_tokens", 0)
             total_tokens = usage_metadata.get("total_tokens", 0)
-            return TokenUsageBaseModel(
-                prompt_tokens=prompt_tokens,
-                completion_tokens=completion_tokens,
-                total_tokens=total_tokens,
-            )
+            cache_tokens = usage_metadata.get("input_token_details", {}).get("cache_read", 0)
+            reasoning_tokens = usage_metadata.get("output_token_details", {}).get("reasoning", 0)
+            return TokenUsageBaseModel(prompt_tokens=prompt_tokens,
+                                       completion_tokens=completion_tokens,
+                                       total_tokens=total_tokens,
+                                       cached_tokens=cache_tokens,
+                                       reasoning_tokens=reasoning_tokens)
         return TokenUsageBaseModel()
     async def on_llm_start(self, serialized: dict[str, Any], prompts: list[str], **kwargs: Any) -> None:
@@ -213,6 +225,7 @@ class LangchainProfilerHandler(AsyncCallbackHandler, BaseProfilerCallback):
         except IndexError:
             generation = None
+        message = None
         if isinstance(generation, ChatGeneration):
             try:
                 message = generation.message
@@ -232,6 +245,17 @@ class LangchainProfilerHandler(AsyncCallbackHandler, BaseProfilerCallback):
         else:
             llm_text_output = ""
+        tool_outputs_list = []
+        # Check whether message.additional_kwargs has tool_outputs, which indicates server-side tool calling
+        if message and message.additional_kwargs and "tool_outputs" in message.additional_kwargs:
+            tools_outputs = message.additional_kwargs["tool_outputs"]
+            if isinstance(tools_outputs, list):
+                for tool in tools_outputs:
+                    try:
+                        tool_outputs_list.append(ServerToolUseSchema(**tool))
+                    except Exception:
+                        pass
         # update shared state behind lock
         with self._lock:
             usage_stat = IntermediateStepPayload(
@@ -243,7 +267,8 @@ class LangchainProfilerHandler(AsyncCallbackHandler, BaseProfilerCallback):
                 data=StreamEventData(input=self._run_id_to_llm_input.get(str(kwargs.get("run_id", "")), ""),
                                      output=llm_text_output),
                 usage_info=UsageInfo(token_usage=self._extract_token_base_model(usage_metadata)),
-                metadata=TraceMetadata(chat_responses=[generation] if generation else []))
+                metadata=TraceMetadata(chat_responses=[generation] if generation else [],
+                                       tool_outputs=tool_outputs_list if tool_outputs_list else []))
             self.step_manager.push_intermediate_step(usage_stat)

nvidia-nat 1.3.0a20250910__py3-none-any.whl → 1.4.0a20251112__py3-none-any.whl

nvidia-nat 1.3.0a20250910py3-none-any.whl → 1.4.0a20251112py3-none-any.whl