PyPI - nvidia-nat - Versions diffs - 1.3.0a20250910__py3-none-any.whl → 1.4.0a20251112__py3-none-any.whl - Mend

nvidia-nat 1.3.0a20250910__py3-none-any.whl → 1.4.0a20251112__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (213) hide show

nat/agent/base.py +13 -8
nat/agent/prompt_optimizer/prompt.py +68 -0
nat/agent/prompt_optimizer/register.py +149 -0
nat/agent/react_agent/agent.py +6 -5
nat/agent/react_agent/register.py +49 -39
nat/agent/reasoning_agent/reasoning_agent.py +17 -15
nat/agent/register.py +2 -0
nat/agent/responses_api_agent/__init__.py +14 -0
nat/agent/responses_api_agent/register.py +126 -0
nat/agent/rewoo_agent/agent.py +304 -117
nat/agent/rewoo_agent/prompt.py +19 -22
nat/agent/rewoo_agent/register.py +51 -38
nat/agent/tool_calling_agent/agent.py +75 -17
nat/agent/tool_calling_agent/register.py +46 -23
nat/authentication/api_key/api_key_auth_provider.py +6 -11
nat/authentication/api_key/api_key_auth_provider_config.py +8 -5
nat/authentication/credential_validator/__init__.py +14 -0
nat/authentication/credential_validator/bearer_token_validator.py +557 -0
nat/authentication/http_basic_auth/http_basic_auth_provider.py +1 -1
nat/authentication/interfaces.py +5 -2
nat/authentication/oauth2/oauth2_auth_code_flow_provider.py +69 -36
nat/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +2 -1
nat/authentication/oauth2/oauth2_resource_server_config.py +125 -0
nat/builder/builder.py +55 -23
nat/builder/component_utils.py +9 -5
nat/builder/context.py +54 -15
nat/builder/eval_builder.py +14 -9
nat/builder/framework_enum.py +1 -0
nat/builder/front_end.py +1 -1
nat/builder/function.py +370 -0
nat/builder/function_info.py +1 -1
nat/builder/intermediate_step_manager.py +38 -2
nat/builder/workflow.py +5 -0
nat/builder/workflow_builder.py +306 -54
nat/cli/cli_utils/config_override.py +1 -1
nat/cli/commands/info/info.py +16 -6
nat/cli/commands/mcp/__init__.py +14 -0
nat/cli/commands/mcp/mcp.py +986 -0
nat/cli/commands/optimize.py +90 -0
nat/cli/commands/start.py +1 -1
nat/cli/commands/workflow/templates/config.yml.j2 +14 -13
nat/cli/commands/workflow/templates/register.py.j2 +2 -2
nat/cli/commands/workflow/templates/workflow.py.j2 +35 -21
nat/cli/commands/workflow/workflow_commands.py +60 -18
nat/cli/entrypoint.py +15 -11
nat/cli/main.py +3 -0
nat/cli/register_workflow.py +38 -4
nat/cli/type_registry.py +72 -1
nat/control_flow/__init__.py +0 -0
nat/control_flow/register.py +20 -0
nat/control_flow/router_agent/__init__.py +0 -0
nat/control_flow/router_agent/agent.py +329 -0
nat/control_flow/router_agent/prompt.py +48 -0
nat/control_flow/router_agent/register.py +91 -0
nat/control_flow/sequential_executor.py +166 -0
nat/data_models/agent.py +34 -0
nat/data_models/api_server.py +199 -69
nat/data_models/authentication.py +23 -9
nat/data_models/common.py +47 -0
nat/data_models/component.py +2 -0
nat/data_models/component_ref.py +11 -0
nat/data_models/config.py +41 -17
nat/data_models/dataset_handler.py +4 -3
nat/data_models/function.py +34 -0
nat/data_models/function_dependencies.py +8 -0
nat/data_models/intermediate_step.py +9 -1
nat/data_models/llm.py +15 -1
nat/data_models/openai_mcp.py +46 -0
nat/data_models/optimizable.py +208 -0
nat/data_models/optimizer.py +161 -0
nat/data_models/span.py +41 -3
nat/data_models/thinking_mixin.py +2 -2
nat/embedder/azure_openai_embedder.py +2 -1
nat/embedder/nim_embedder.py +3 -2
nat/embedder/openai_embedder.py +3 -2
nat/eval/config.py +1 -1
nat/eval/dataset_handler/dataset_downloader.py +3 -2
nat/eval/dataset_handler/dataset_filter.py +34 -2
nat/eval/evaluate.py +10 -3
nat/eval/evaluator/base_evaluator.py +1 -1
nat/eval/rag_evaluator/evaluate.py +7 -4
nat/eval/register.py +4 -0
nat/eval/runtime_evaluator/__init__.py +14 -0
nat/eval/runtime_evaluator/evaluate.py +123 -0
nat/eval/runtime_evaluator/register.py +100 -0
nat/eval/swe_bench_evaluator/evaluate.py +1 -1
nat/eval/trajectory_evaluator/register.py +1 -1
nat/eval/tunable_rag_evaluator/evaluate.py +1 -1
nat/eval/usage_stats.py +2 -0
nat/eval/utils/output_uploader.py +3 -2
nat/eval/utils/weave_eval.py +17 -3
nat/experimental/decorators/experimental_warning_decorator.py +27 -7
nat/experimental/test_time_compute/functions/execute_score_select_function.py +1 -1
nat/experimental/test_time_compute/functions/plan_select_execute_function.py +7 -3
nat/experimental/test_time_compute/functions/ttc_tool_orchestration_function.py +1 -1
nat/experimental/test_time_compute/functions/ttc_tool_wrapper_function.py +3 -3
nat/experimental/test_time_compute/models/strategy_base.py +2 -2
nat/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +1 -1
nat/front_ends/console/authentication_flow_handler.py +82 -30
nat/front_ends/console/console_front_end_plugin.py +19 -7
nat/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +1 -1
nat/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +52 -17
nat/front_ends/fastapi/dask_client_mixin.py +65 -0
nat/front_ends/fastapi/fastapi_front_end_config.py +25 -3
nat/front_ends/fastapi/fastapi_front_end_plugin.py +140 -3
nat/front_ends/fastapi/fastapi_front_end_plugin_worker.py +445 -265
nat/front_ends/fastapi/job_store.py +518 -99
nat/front_ends/fastapi/main.py +11 -19
nat/front_ends/fastapi/message_handler.py +69 -44
nat/front_ends/fastapi/message_validator.py +8 -7
nat/front_ends/fastapi/utils.py +57 -0
nat/front_ends/mcp/introspection_token_verifier.py +73 -0
nat/front_ends/mcp/mcp_front_end_config.py +71 -3
nat/front_ends/mcp/mcp_front_end_plugin.py +85 -21
nat/front_ends/mcp/mcp_front_end_plugin_worker.py +248 -29
nat/front_ends/mcp/memory_profiler.py +320 -0
nat/front_ends/mcp/tool_converter.py +78 -25
nat/front_ends/simple_base/simple_front_end_plugin_base.py +3 -1
nat/llm/aws_bedrock_llm.py +21 -8
nat/llm/azure_openai_llm.py +14 -5
nat/llm/litellm_llm.py +80 -0
nat/llm/nim_llm.py +23 -9
nat/llm/openai_llm.py +19 -7
nat/llm/register.py +4 -0
nat/llm/utils/thinking.py +1 -1
nat/observability/exporter/base_exporter.py +1 -1
nat/observability/exporter/processing_exporter.py +29 -55
nat/observability/exporter/span_exporter.py +43 -15
nat/observability/exporter_manager.py +2 -2
nat/observability/mixin/redaction_config_mixin.py +5 -4
nat/observability/mixin/tagging_config_mixin.py +26 -14
nat/observability/mixin/type_introspection_mixin.py +420 -107
nat/observability/processor/batching_processor.py +1 -1
nat/observability/processor/processor.py +3 -0
nat/observability/processor/redaction/__init__.py +24 -0
nat/observability/processor/redaction/contextual_redaction_processor.py +125 -0
nat/observability/processor/redaction/contextual_span_redaction_processor.py +66 -0
nat/observability/processor/redaction/redaction_processor.py +177 -0
nat/observability/processor/redaction/span_header_redaction_processor.py +92 -0
nat/observability/processor/span_tagging_processor.py +21 -14
nat/observability/register.py +16 -0
nat/profiler/callbacks/langchain_callback_handler.py +32 -7
nat/profiler/callbacks/llama_index_callback_handler.py +36 -2
nat/profiler/callbacks/token_usage_base_model.py +2 -0
nat/profiler/decorators/framework_wrapper.py +61 -9
nat/profiler/decorators/function_tracking.py +35 -3
nat/profiler/forecasting/models/linear_model.py +1 -1
nat/profiler/forecasting/models/random_forest_regressor.py +1 -1
nat/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +1 -1
nat/profiler/inference_optimization/experimental/prefix_span_analysis.py +1 -1
nat/profiler/parameter_optimization/__init__.py +0 -0
nat/profiler/parameter_optimization/optimizable_utils.py +93 -0
nat/profiler/parameter_optimization/optimizer_runtime.py +67 -0
nat/profiler/parameter_optimization/parameter_optimizer.py +189 -0
nat/profiler/parameter_optimization/parameter_selection.py +107 -0
nat/profiler/parameter_optimization/pareto_visualizer.py +460 -0
nat/profiler/parameter_optimization/prompt_optimizer.py +384 -0
nat/profiler/parameter_optimization/update_helpers.py +66 -0
nat/profiler/utils.py +3 -1
nat/registry_handlers/pypi/register_pypi.py +5 -3
nat/registry_handlers/rest/register_rest.py +5 -3
nat/retriever/milvus/retriever.py +1 -1
nat/retriever/nemo_retriever/register.py +2 -1
nat/runtime/loader.py +1 -1
nat/runtime/runner.py +111 -6
nat/runtime/session.py +49 -3
nat/settings/global_settings.py +2 -2
nat/tool/chat_completion.py +4 -1
nat/tool/code_execution/code_sandbox.py +3 -6
nat/tool/code_execution/local_sandbox/Dockerfile.sandbox +19 -32
nat/tool/code_execution/local_sandbox/local_sandbox_server.py +6 -1
nat/tool/code_execution/local_sandbox/sandbox.requirements.txt +2 -0
nat/tool/code_execution/local_sandbox/start_local_sandbox.sh +10 -4
nat/tool/datetime_tools.py +1 -1
nat/tool/github_tools.py +450 -0
nat/tool/memory_tools/add_memory_tool.py +3 -3
nat/tool/memory_tools/delete_memory_tool.py +3 -4
nat/tool/memory_tools/get_memory_tool.py +4 -4
nat/tool/register.py +2 -7
nat/tool/server_tools.py +15 -2
nat/utils/__init__.py +76 -0
nat/utils/callable_utils.py +70 -0
nat/utils/data_models/schema_validator.py +1 -1
nat/utils/decorators.py +210 -0
nat/utils/exception_handlers/automatic_retries.py +278 -72
nat/utils/io/yaml_tools.py +73 -3
nat/utils/log_levels.py +25 -0
nat/utils/responses_api.py +26 -0
nat/utils/string_utils.py +16 -0
nat/utils/type_converter.py +12 -3
nat/utils/type_utils.py +6 -2
nvidia_nat-1.4.0a20251112.dist-info/METADATA +197 -0
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/RECORD +199 -165
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/entry_points.txt +1 -0
nat/cli/commands/info/list_mcp.py +0 -461
nat/data_models/temperature_mixin.py +0 -43
nat/data_models/top_p_mixin.py +0 -43
nat/observability/processor/header_redaction_processor.py +0 -123
nat/observability/processor/redaction_processor.py +0 -77
nat/tool/code_execution/test_code_execution_sandbox.py +0 -414
nat/tool/github_tools/create_github_commit.py +0 -133
nat/tool/github_tools/create_github_issue.py +0 -87
nat/tool/github_tools/create_github_pr.py +0 -106
nat/tool/github_tools/get_github_file.py +0 -106
nat/tool/github_tools/get_github_issue.py +0 -166
nat/tool/github_tools/get_github_pr.py +0 -256
nat/tool/github_tools/update_github_issue.py +0 -100
nvidia_nat-1.3.0a20250910.dist-info/METADATA +0 -373
/nat/{tool/github_tools → agent/prompt_optimizer}/__init__.py +0 -0
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/WHEEL +0 -0
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/licenses/LICENSE-3rd-party.txt +0 -0
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/licenses/LICENSE.md +0 -0
{nvidia_nat-1.3.0a20250910.dist-info → nvidia_nat-1.4.0a20251112.dist-info}/top_level.txt +0 -0

nat/profiler/callbacks/llama_index_callback_handler.py CHANGED Viewed

@@ -30,6 +30,7 @@ from nat.builder.context import Context
 from nat.builder.framework_enum import LLMFrameworkEnum
 from nat.data_models.intermediate_step import IntermediateStepPayload
 from nat.data_models.intermediate_step import IntermediateStepType
+from nat.data_models.intermediate_step import ServerToolUseSchema
 from nat.data_models.intermediate_step import StreamEventData
 from nat.data_models.intermediate_step import TraceMetadata
 from nat.data_models.intermediate_step import UsageInfo
@@ -64,6 +65,26 @@ class LlamaIndexProfilerHandler(BaseCallbackHandler, BaseProfilerCallback):
         self._run_id_to_tool_input = {}
         self._run_id_to_timestamp = {}
+    @staticmethod
+    def _extract_token_usage(response: ChatResponse) -> TokenUsageBaseModel:
+        token_usage = TokenUsageBaseModel()
+        try:
+            if response and response.additional_kwargs and "usage" in response.additional_kwargs:
+                usage = response.additional_kwargs["usage"] if "usage" in response.additional_kwargs else {}
+                token_usage.prompt_tokens = usage.input_tokens if hasattr(usage, "input_tokens") else 0
+                token_usage.completion_tokens = usage.output_tokens if hasattr(usage, "output_tokens") else 0
+                if hasattr(usage, "input_tokens_details") and hasattr(usage.input_tokens_details, "cached_tokens"):
+                    token_usage.cached_tokens = usage.input_tokens_details.cached_tokens
+                if hasattr(usage, "output_tokens_details") and hasattr(usage.output_tokens_details, "reasoning_tokens"):
+                    token_usage.reasoning_tokens = usage.output_tokens_details.reasoning_tokens
+        except Exception as e:
+            logger.debug("Error extracting token usage: %s", e, exc_info=True)
+        return token_usage
     def on_event_start(
         self,
         event_type: CBEventType,
@@ -167,6 +188,18 @@ class LlamaIndexProfilerHandler(BaseCallbackHandler, BaseProfilerCallback):
                 except Exception as e:
                     logger.exception("Error getting model name: %s", e)
+                # Append usage data to NAT usage stats
+                tool_outputs_list = []
+                # Check if message.additional_kwargs as tool_outputs indicative of server side tool calling
+                if response and response.additional_kwargs and "built_in_tool_calls" in response.additional_kwargs:
+                    tools_outputs = response.additional_kwargs["built_in_tool_calls"]
+                    if isinstance(tools_outputs, list):
+                        for tool in tools_outputs:
+                            try:
+                                tool_outputs_list.append(ServerToolUseSchema(**tool.model_dump()))
+                            except Exception:
+                                pass
                 # Append usage data to NAT usage stats
                 with self._lock:
                     stats = IntermediateStepPayload(
@@ -176,8 +209,9 @@ class LlamaIndexProfilerHandler(BaseCallbackHandler, BaseProfilerCallback):
                         name=model_name,
                         UUID=event_id,
                         data=StreamEventData(input=self._run_id_to_llm_input.get(event_id), output=llm_text_output),
-                        metadata=TraceMetadata(chat_responses=response.message if response.message else None),
-                        usage_info=UsageInfo(token_usage=TokenUsageBaseModel(**response.additional_kwargs)))
+                        metadata=TraceMetadata(chat_responses=response.message if response.message else None,
+                                               tool_outputs=tool_outputs_list if tool_outputs_list else []),
+                        usage_info=UsageInfo(token_usage=self._extract_token_usage(response)))
                     self.step_manager.push_intermediate_step(stats)
         elif event_type == CBEventType.FUNCTION_CALL and payload:

nat/profiler/callbacks/token_usage_base_model.py CHANGED Viewed

@@ -24,4 +24,6 @@ class TokenUsageBaseModel(BaseModel):
     prompt_tokens: int = Field(default=0, description="Number of tokens in the prompt.")
     completion_tokens: int = Field(default=0, description="Number of tokens in the completion.")
+    cached_tokens: int = Field(default=0, description="Number of tokens read from cache.")
+    reasoning_tokens: int = Field(default=0, description="Number of tokens used for reasoning.")
     total_tokens: int = Field(default=0, description="Number of tokens total.")

nat/profiler/decorators/framework_wrapper.py CHANGED Viewed

@@ -17,6 +17,7 @@ from __future__ import annotations
 import functools
 import logging
+from collections.abc import AsyncIterator
 from collections.abc import Callable
 from contextlib import AbstractAsyncContextManager as AsyncContextManager
 from contextlib import asynccontextmanager
@@ -32,35 +33,55 @@ _library_instrumented = {
     "crewai": False,
     "semantic_kernel": False,
     "agno": False,
+    "adk": False,
 }
 callback_handler_var: ContextVar[Any | None] = ContextVar("callback_handler_var", default=None)
 def set_framework_profiler_handler(
-    workflow_llms: dict = None,
-    frameworks: list[LLMFrameworkEnum] = None,
+    workflow_llms: dict | None = None,
+    frameworks: list[LLMFrameworkEnum] | None = None,
 ) -> Callable[[Callable[..., AsyncContextManager[Any]]], Callable[..., AsyncContextManager[Any]]]:
     """
     Decorator that wraps an async context manager function to set up framework-specific profiling.
+    Args:
+        workflow_llms (dict | None): A dictionary of workflow LLM configurations.
+        frameworks (list[LLMFrameworkEnum] | None): A list of LLM frameworks used in the workflow functions.
+    Returns:
+        Callable[[Callable[..., AsyncContextManager[Any]]], Callable[..., AsyncContextManager[Any]]]:
+        A decorator that wraps the original function with profiling setup.
     """
     def decorator(func: Callable[..., AsyncContextManager[Any]]) -> Callable[..., AsyncContextManager[Any]]:
+        """The actual decorator that wraps the function.
+        Args:
+            func (Callable[..., AsyncContextManager[Any]]): The function to wrap.
+        Returns:
+            Callable[..., AsyncContextManager[Any]]: The wrapped function.
+        """
         @functools.wraps(func)
         @asynccontextmanager
         async def wrapper(workflow_config, builder):
-            if LLMFrameworkEnum.LANGCHAIN in frameworks and not _library_instrumented["langchain"]:
-                from langchain_core.tracers.context import register_configure_hook
+            if LLMFrameworkEnum.LANGCHAIN in frameworks:
+                # Always set a fresh handler in the current context so callbacks
+                # route to the active run. Only register the hook once globally.
                 from nat.profiler.callbacks.langchain_callback_handler import LangchainProfilerHandler
                 handler = LangchainProfilerHandler()
                 callback_handler_var.set(handler)
-                register_configure_hook(callback_handler_var, inheritable=True)
-                _library_instrumented["langchain"] = True
-                logger.debug("LangChain/LangGraph callback handler registered")
+                if not _library_instrumented["langchain"]:
+                    from langchain_core.tracers.context import register_configure_hook
+                    register_configure_hook(callback_handler_var, inheritable=True)
+                    _library_instrumented["langchain"] = True
+                    logger.debug("LangChain/LangGraph callback hook registered")
             if LLMFrameworkEnum.LLAMA_INDEX in frameworks:
                 from llama_index.core import Settings
@@ -96,6 +117,20 @@ def set_framework_profiler_handler(
                 _library_instrumented["agno"] = True
                 logger.info("Agno callback handler registered")
+            if LLMFrameworkEnum.ADK in frameworks and not _library_instrumented["adk"]:
+                try:
+                    from nat.plugins.adk.adk_callback_handler import ADKProfilerHandler
+                except ImportError as e:
+                    logger.warning(
+                        "ADK profiler not available. " +
+                        "Install NAT with ADK extras: pip install \"nvidia-nat[adk]\". Error: %s",
+                        e)
+                else:
+                    handler = ADKProfilerHandler()
+                    handler.instrument()
+                    _library_instrumented["adk"] = True
+                    logger.debug("ADK callback handler registered")
             # IMPORTANT: actually call the wrapped function as an async context manager
             async with func(workflow_config, builder) as result:
                 yield result
@@ -114,11 +149,28 @@ def chain_wrapped_build_fn(
     Convert an original build function into an async context manager that
     wraps it with a single call to set_framework_profiler_handler, passing
     all frameworks at once.
+    Args:
+        original_build_fn (Callable[..., AsyncContextManager]): The original build function to wrap.
+        workflow_llms (dict): A dictionary of workflow LLM configurations.
+        function_frameworks (list[LLMFrameworkEnum]): A list of LLM frameworks used in the workflow functions.
+    Returns:
+        Callable[..., AsyncContextManager]: The wrapped build function.
     """
     # Define a base async context manager that simply calls the original build function.
     @asynccontextmanager
-    async def base_fn(*args, **kwargs):
+    async def base_fn(*args, **kwargs) -> AsyncIterator[Any]:
+        """Base async context manager that calls the original build function.
+        Args:
+            *args: Positional arguments to pass to the original build function.
+            **kwargs: Keyword arguments to pass to the original build function.
+        Yields:
+            The result of the original build function.
+        """
         async with original_build_fn(*args, **kwargs) as w:
             yield w

nat/profiler/decorators/function_tracking.py CHANGED Viewed

@@ -18,7 +18,9 @@ import inspect
 import uuid
 from collections.abc import Callable
 from typing import Any
+from typing import TypeVar
 from typing import cast
+from typing import overload
 from pydantic import BaseModel
@@ -38,10 +40,10 @@ def _serialize_data(obj: Any) -> Any:
     if isinstance(obj, dict):
         return {str(k): _serialize_data(v) for k, v in obj.items()}
-    if isinstance(obj, (list, tuple, set)):
+    if isinstance(obj, list | tuple | set):
         return [_serialize_data(item) for item in obj]
-    if isinstance(obj, (str, int, float, bool, type(None))):
+    if isinstance(obj, str | int | float | bool | type(None)):
         return obj
     # Fallback
@@ -77,7 +79,24 @@ def push_intermediate_step(step_manager: IntermediateStepManager,
     step_manager.push_intermediate_step(payload)
-def track_function(func: Any = None, *, metadata: dict[str, Any] | None = None):
+# Type variable for overloads
+F = TypeVar('F', bound=Callable[..., Any])
+# Overloads for different function types
+@overload
+def track_function(func: F, *, metadata: dict[str, Any] | None = None) -> F:
+    """Overload for when a function is passed directly."""
+    ...
+@overload
+def track_function(*, metadata: dict[str, Any] | None = None) -> Callable[[F], F]:
+    """Overload for decorator factory usage (when called with parentheses)."""
+    ...
+def track_function(func: Any = None, *, metadata: dict[str, Any] | None = None) -> Any:
     """
     Decorator that can wrap any type of function (sync, async, generator,
     async generator) and executes "tracking logic" around it.
@@ -256,6 +275,19 @@ def track_function(func: Any = None, *, metadata: dict[str, Any] | None = None):
     return sync_wrapper
+# Overloads for track_unregistered_function
+@overload
+def track_unregistered_function(func: F, *, name: str | None = None, metadata: dict[str, Any] | None = None) -> F:
+    """Overload for when a function is passed directly."""
+    ...
+@overload
+def track_unregistered_function(*, name: str | None = None, metadata: dict[str, Any] | None = None) -> Callable[[F], F]:
+    """Overload for decorator factory usage (when called with parentheses)."""
+    ...
 def track_unregistered_function(func: Callable[..., Any] | None = None,
                                 *,
                                 name: str | None = None,

nat/profiler/forecasting/models/linear_model.py CHANGED Viewed

@@ -36,7 +36,7 @@ class LinearModel(ForecastingBaseModel):
         except ImportError:
             logger.error(
                 "scikit-learn is not installed. Please install scikit-learn to use the LinearModel "
-                "profiling model or install `nvidia-nat[profiler]` to install all necessary profiling packages.")
+                "profiling model or install \"nvidia-nat[profiler]\" to install all necessary profiling packages.")
             raise

nat/profiler/forecasting/models/random_forest_regressor.py CHANGED Viewed

@@ -36,7 +36,7 @@ class RandomForestModel(ForecastingBaseModel):
         except ImportError:
             logger.error(
                 "scikit-learn is not installed. Please install scikit-learn to use the RandomForest "
-                "profiling model or install `nvidia-nat[profiler]` to install all necessary profiling packages.")
+                "profiling model or install \"nvidia-nat[profiler]\" to install all necessary profiling packages.")
             raise

nat/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py CHANGED Viewed

@@ -304,7 +304,7 @@ def save_gantt_chart(all_nodes: list[CallNode], output_path: str) -> None:
         import matplotlib.pyplot as plt
     except ImportError:
         logger.error("matplotlib is not installed. Please install matplotlib to use generate plots for the profiler "
-                     "or install `nvidia-nat[profiler]` to install all necessary profiling packages.")
+                     "or install \"nvidia-nat[profiler]\" to install all necessary profiling packages.")
         raise

nat/profiler/inference_optimization/experimental/prefix_span_analysis.py CHANGED Viewed

@@ -212,7 +212,7 @@ def run_prefixspan(sequences_map: dict[int, list[PrefixCallNode]],
         from prefixspan import PrefixSpan
     except ImportError:
         logger.error("prefixspan is not installed. Please install prefixspan to run the prefix analysis in the "
-                     "profiler or install `nvidia-nat[profiler]` to install all necessary profiling packages.")
+                     "profiler or install \"nvidia-nat[profiler]\" to install all necessary profiling packages.")
         raise

nat/profiler/parameter_optimization/__init__.py ADDED Viewed

File without changes

nat/profiler/parameter_optimization/optimizable_utils.py ADDED Viewed

@@ -0,0 +1,93 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import logging
+from typing import get_args
+from typing import get_origin
+from pydantic import BaseModel
+from nat.data_models.optimizable import SearchSpace
+logger = logging.getLogger(__name__)
+def walk_optimizables(obj: BaseModel, path: str = "") -> dict[str, SearchSpace]:
+    """
+    Recursively build ``{flattened.path: SearchSpace}`` for every optimizable
+    field inside *obj*.
+    * Honors ``optimizable_params`` on any model that mixes in
+      ``OptimizableMixin`` – only listed fields are kept.
+    * If a model contains optimizable fields **but** omits
+      ``optimizable_params``, we emit a warning and skip them.
+    """
+    spaces: dict[str, SearchSpace] = {}
+    allowed_params_raw = getattr(obj, "optimizable_params", None)
+    allowed_params = set(allowed_params_raw) if allowed_params_raw is not None else None
+    overrides = getattr(obj, "search_space", {}) or {}
+    has_optimizable_flag = False
+    for name, fld in obj.model_fields.items():
+        full = f"{path}.{name}" if path else name
+        extra = fld.json_schema_extra or {}
+        is_field_optimizable = extra.get("optimizable", False) or name in overrides
+        has_optimizable_flag = has_optimizable_flag or is_field_optimizable
+        # honour allow-list
+        if allowed_params is not None and name not in allowed_params:
+            continue
+        # 1. plain optimizable field or override from config
+        if is_field_optimizable:
+            space = overrides.get(name, extra.get("search_space"))
+            if space is None:
+                logger.error(
+                    "Field %s is marked optimizable but no search space was provided.",
+                    full,
+                )
+                raise ValueError(f"Field {full} is marked optimizable but no search space was provided")
+            spaces[full] = space
+        value = getattr(obj, name, None)
+        # 2. nested BaseModel
+        if isinstance(value, BaseModel):
+            spaces.update(walk_optimizables(value, full))
+        # 3. dict[str, BaseModel] container
+        elif isinstance(value, dict):
+            for key, subval in value.items():
+                if isinstance(subval, BaseModel):
+                    spaces.update(walk_optimizables(subval, f"{full}.{key}"))
+        # 4. static-type fallback for class-level annotations
+        elif isinstance(obj, type):
+            ann = fld.annotation
+            if get_origin(ann) in (dict, dict):
+                _, val_t = get_args(ann) or (None, None)
+                if isinstance(val_t, type) and issubclass(val_t, BaseModel):
+                    if allowed_params is None or name in allowed_params:
+                        spaces[f"{full}.*"] = SearchSpace(low=None, high=None)  # sentinel
+    if allowed_params is None and has_optimizable_flag:
+        logger.warning(
+            "Model %s contains optimizable fields but no `optimizable_params` "
+            "were defined; these fields will be ignored.",
+            obj.__class__.__name__,
+        )
+    return spaces

nat/profiler/parameter_optimization/optimizer_runtime.py ADDED Viewed

@@ -0,0 +1,67 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import logging
+from pydantic import BaseModel
+from nat.data_models.optimizer import OptimizerRunConfig
+from nat.experimental.decorators.experimental_warning_decorator import experimental
+from nat.profiler.parameter_optimization.optimizable_utils import walk_optimizables
+from nat.profiler.parameter_optimization.parameter_optimizer import optimize_parameters
+from nat.profiler.parameter_optimization.prompt_optimizer import optimize_prompts
+from nat.runtime.loader import load_config
+logger = logging.getLogger(__name__)
+@experimental(feature_name="Optimizer")
+async def optimize_config(opt_run_config: OptimizerRunConfig):
+    """Entry-point called by the CLI or runtime."""
+    # ---------------- 1. load / normalise ---------------- #
+    if not isinstance(opt_run_config.config_file, BaseModel):
+        from nat.data_models.config import Config  # guarded import
+        base_cfg: Config = load_config(config_file=opt_run_config.config_file)
+    else:
+        base_cfg = opt_run_config.config_file  # already validated
+    # ---------------- 2. discover search space ----------- #
+    full_space = walk_optimizables(base_cfg)
+    if not full_space:
+        logger.warning("No optimizable parameters found in the configuration. "
+                       "Skipping optimization.")
+        return base_cfg
+    # ---------------- 3. numeric / enum tuning ----------- #
+    tuned_cfg = base_cfg
+    if base_cfg.optimizer.numeric.enabled:
+        tuned_cfg = optimize_parameters(
+            base_cfg=base_cfg,
+            full_space=full_space,
+            optimizer_config=base_cfg.optimizer,
+            opt_run_config=opt_run_config,
+        )
+    # ---------------- 4. prompt optimization ------------- #
+    if base_cfg.optimizer.prompt.enabled:
+        await optimize_prompts(
+            base_cfg=tuned_cfg,
+            full_space=full_space,
+            optimizer_config=base_cfg.optimizer,
+            opt_run_config=opt_run_config,
+        )
+    logger.info("All optimization phases complete.")
+    return tuned_cfg

nat/profiler/parameter_optimization/parameter_optimizer.py ADDED Viewed

@@ -0,0 +1,189 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import asyncio
+import logging
+from collections.abc import Mapping as Dict
+import optuna
+import yaml
+from nat.data_models.config import Config
+from nat.data_models.optimizable import SearchSpace
+from nat.data_models.optimizer import OptimizerConfig
+from nat.data_models.optimizer import OptimizerRunConfig
+from nat.data_models.optimizer import SamplerType
+from nat.eval.evaluate import EvaluationRun
+from nat.eval.evaluate import EvaluationRunConfig
+from nat.experimental.decorators.experimental_warning_decorator import experimental
+from nat.profiler.parameter_optimization.parameter_selection import pick_trial
+from nat.profiler.parameter_optimization.update_helpers import apply_suggestions
+logger = logging.getLogger(__name__)
+@experimental(feature_name="Optimizer")
+def optimize_parameters(
+    *,
+    base_cfg: Config,
+    full_space: Dict[str, SearchSpace],
+    optimizer_config: OptimizerConfig,
+    opt_run_config: OptimizerRunConfig,
+) -> Config:
+    """Tune all *non-prompt* hyper-parameters and persist the best config."""
+    space = {k: v for k, v in full_space.items() if not v.is_prompt}
+    # Ensure output_path is not None
+    if optimizer_config.output_path is None:
+        raise ValueError("optimizer_config.output_path cannot be None")
+    out_dir = optimizer_config.output_path
+    out_dir.mkdir(parents=True, exist_ok=True)
+    # Ensure eval_metrics is not None
+    if optimizer_config.eval_metrics is None:
+        raise ValueError("optimizer_config.eval_metrics cannot be None")
+    metric_cfg = optimizer_config.eval_metrics
+    directions = [v.direction for v in metric_cfg.values()]
+    eval_metrics = [v.evaluator_name for v in metric_cfg.values()]
+    weights = [v.weight for v in metric_cfg.values()]
+    # Create appropriate sampler based on configuration
+    sampler_type = optimizer_config.numeric.sampler
+    if sampler_type == SamplerType.GRID:
+        # For grid search, convert the existing space to value sequences
+        grid_search_space = {param_name: search_space.to_grid_values() for param_name, search_space in space.items()}
+        sampler = optuna.samplers.GridSampler(grid_search_space)
+        logger.info("Using Grid sampler for numeric optimization")
+    else:
+        # None or BAYESIAN: let Optuna choose defaults
+        sampler = None
+        logger.info(
+            "Using Optuna default sampler types: TPESampler for single-objective, NSGAIISampler for multi-objective")
+    study = optuna.create_study(directions=directions, sampler=sampler)
+    # Create output directory for intermediate files
+    out_dir = optimizer_config.output_path
+    out_dir.mkdir(parents=True, exist_ok=True)
+    async def _run_eval(runner: EvaluationRun):
+        return await runner.run_and_evaluate()
+    def _objective(trial: optuna.Trial):
+        reps = max(1, getattr(optimizer_config, "reps_per_param_set", 1))
+        # build trial config
+        suggestions = {p: spec.suggest(trial, p) for p, spec in space.items()}
+        cfg_trial = apply_suggestions(base_cfg, suggestions)
+        async def _single_eval(trial_idx: int) -> list[float]:  # noqa: ARG001
+            eval_cfg = EvaluationRunConfig(
+                config_file=cfg_trial,
+                dataset=opt_run_config.dataset,
+                result_json_path=opt_run_config.result_json_path,
+                endpoint=opt_run_config.endpoint,
+                endpoint_timeout=opt_run_config.endpoint_timeout,
+            )
+            scores = await _run_eval(EvaluationRun(config=eval_cfg))
+            values = []
+            for metric_name in eval_metrics:
+                metric = next(r[1] for r in scores.evaluation_results if r[0] == metric_name)
+                values.append(metric.average_score)
+            return values
+        # Create tasks for all evaluations
+        async def _run_all_evals():
+            tasks = [_single_eval(i) for i in range(reps)]
+            return await asyncio.gather(*tasks)
+        # Calculate padding width based on total number of trials
+        trial_id_width = len(str(max(0, optimizer_config.numeric.n_trials - 1)))
+        trial_id_padded = f"{trial.number:0{trial_id_width}d}"
+        with (out_dir / f"config_numeric_trial_{trial_id_padded}.yml").open("w") as fh:
+            yaml.dump(cfg_trial.model_dump(), fh)
+        all_scores = asyncio.run(_run_all_evals())
+        # Persist raw per‑repetition scores so they appear in `trials_dataframe`.
+        trial.set_user_attr("rep_scores", all_scores)
+        return [sum(run[i] for run in all_scores) / reps for i in range(len(eval_metrics))]
+    logger.info("Starting numeric / enum parameter optimization...")
+    study.optimize(_objective, n_trials=optimizer_config.numeric.n_trials)
+    logger.info("Numeric optimization finished")
+    best_params = pick_trial(
+        study=study,
+        mode=optimizer_config.multi_objective_combination_mode,
+        weights=weights,
+    ).params
+    tuned_cfg = apply_suggestions(base_cfg, best_params)
+    # Save final results (out_dir already created and defined above)
+    with (out_dir / "optimized_config.yml").open("w") as fh:
+        yaml.dump(tuned_cfg.model_dump(mode='json'), fh)
+    with (out_dir / "trials_dataframe_params.csv").open("w") as fh:
+        # Export full trials DataFrame (values, params, timings, etc.).
+        df = study.trials_dataframe()
+        # Rename values_X columns to actual metric names
+        metric_names = list(metric_cfg.keys())
+        rename_mapping = {}
+        for i, metric_name in enumerate(metric_names):
+            old_col = f"values_{i}"
+            if old_col in df.columns:
+                rename_mapping[old_col] = f"values_{metric_name}"
+        if rename_mapping:
+            df = df.rename(columns=rename_mapping)
+        # Normalise rep_scores column naming for convenience.
+        if "user_attrs_rep_scores" in df.columns and "rep_scores" not in df.columns:
+            df = df.rename(columns={"user_attrs_rep_scores": "rep_scores"})
+        elif "user_attrs" in df.columns and "rep_scores" not in df.columns:
+            # Some Optuna versions return a dict in a single user_attrs column.
+            df["rep_scores"] = df["user_attrs"].apply(lambda d: d.get("rep_scores") if isinstance(d, dict) else None)
+            df = df.drop(columns=["user_attrs"])
+        # Get Pareto optimal trial numbers from Optuna study
+        pareto_trials = study.best_trials
+        pareto_trial_numbers = {trial.number for trial in pareto_trials}
+        # Add boolean column indicating if trial is Pareto optimal
+        df["pareto_optimal"] = df["number"].isin(pareto_trial_numbers)
+        df.to_csv(fh, index=False)
+    # Generate Pareto front visualizations
+    try:
+        from nat.profiler.parameter_optimization.pareto_visualizer import create_pareto_visualization
+        logger.info("Generating Pareto front visualizations...")
+        create_pareto_visualization(
+            data_source=study,
+            metric_names=eval_metrics,
+            directions=directions,
+            output_dir=out_dir / "plots",
+            title_prefix="Parameter Optimization",
+            show_plots=False  # Don't show plots in automated runs
+        )
+        logger.info("Pareto visualizations saved to: %s", out_dir / "plots")
+    except ImportError as ie:
+        logger.warning("Could not import visualization dependencies: %s. "
+                       "Have you installed nvidia-nat-profiling?",
+                       ie)
+    except Exception as e:
+        logger.warning("Failed to generate visualizations: %s", e)
+    return tuned_cfg

nvidia-nat 1.3.0a20250910__py3-none-any.whl → 1.4.0a20251112__py3-none-any.whl

nvidia-nat 1.3.0a20250910py3-none-any.whl → 1.4.0a20251112py3-none-any.whl