nvidia-nat 1.3.0.dev2__py3-none-any.whl → 1.3.0rc2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (250)
  1. aiq/__init__.py +2 -2
  2. nat/agent/base.py +24 -15
  3. nat/agent/dual_node.py +9 -4
  4. nat/agent/prompt_optimizer/prompt.py +68 -0
  5. nat/agent/prompt_optimizer/register.py +149 -0
  6. nat/agent/react_agent/agent.py +79 -47
  7. nat/agent/react_agent/register.py +50 -22
  8. nat/agent/reasoning_agent/reasoning_agent.py +11 -9
  9. nat/agent/register.py +1 -1
  10. nat/agent/rewoo_agent/agent.py +326 -148
  11. nat/agent/rewoo_agent/prompt.py +19 -22
  12. nat/agent/rewoo_agent/register.py +54 -27
  13. nat/agent/tool_calling_agent/agent.py +84 -28
  14. nat/agent/tool_calling_agent/register.py +51 -28
  15. nat/authentication/api_key/api_key_auth_provider.py +2 -2
  16. nat/authentication/credential_validator/bearer_token_validator.py +557 -0
  17. nat/authentication/http_basic_auth/http_basic_auth_provider.py +1 -1
  18. nat/authentication/interfaces.py +5 -2
  19. nat/authentication/oauth2/oauth2_auth_code_flow_provider.py +69 -36
  20. nat/authentication/oauth2/oauth2_resource_server_config.py +124 -0
  21. nat/authentication/register.py +0 -1
  22. nat/builder/builder.py +56 -24
  23. nat/builder/component_utils.py +9 -5
  24. nat/builder/context.py +68 -17
  25. nat/builder/eval_builder.py +16 -11
  26. nat/builder/framework_enum.py +1 -0
  27. nat/builder/front_end.py +1 -1
  28. nat/builder/function.py +378 -8
  29. nat/builder/function_base.py +3 -3
  30. nat/builder/function_info.py +6 -8
  31. nat/builder/user_interaction_manager.py +2 -2
  32. nat/builder/workflow.py +13 -1
  33. nat/builder/workflow_builder.py +281 -76
  34. nat/cli/cli_utils/config_override.py +2 -2
  35. nat/cli/commands/evaluate.py +1 -1
  36. nat/cli/commands/info/info.py +16 -6
  37. nat/cli/commands/info/list_channels.py +1 -1
  38. nat/cli/commands/info/list_components.py +7 -8
  39. nat/cli/commands/mcp/__init__.py +14 -0
  40. nat/cli/commands/mcp/mcp.py +986 -0
  41. nat/cli/commands/object_store/__init__.py +14 -0
  42. nat/cli/commands/object_store/object_store.py +227 -0
  43. nat/cli/commands/optimize.py +90 -0
  44. nat/cli/commands/registry/publish.py +2 -2
  45. nat/cli/commands/registry/pull.py +2 -2
  46. nat/cli/commands/registry/remove.py +2 -2
  47. nat/cli/commands/registry/search.py +15 -17
  48. nat/cli/commands/start.py +16 -5
  49. nat/cli/commands/uninstall.py +1 -1
  50. nat/cli/commands/workflow/templates/config.yml.j2 +14 -13
  51. nat/cli/commands/workflow/templates/pyproject.toml.j2 +4 -1
  52. nat/cli/commands/workflow/templates/register.py.j2 +2 -3
  53. nat/cli/commands/workflow/templates/workflow.py.j2 +35 -21
  54. nat/cli/commands/workflow/workflow_commands.py +62 -22
  55. nat/cli/entrypoint.py +8 -10
  56. nat/cli/main.py +3 -0
  57. nat/cli/register_workflow.py +38 -4
  58. nat/cli/type_registry.py +75 -6
  59. nat/control_flow/__init__.py +0 -0
  60. nat/control_flow/register.py +20 -0
  61. nat/control_flow/router_agent/__init__.py +0 -0
  62. nat/control_flow/router_agent/agent.py +329 -0
  63. nat/control_flow/router_agent/prompt.py +48 -0
  64. nat/control_flow/router_agent/register.py +91 -0
  65. nat/control_flow/sequential_executor.py +166 -0
  66. nat/data_models/agent.py +34 -0
  67. nat/data_models/api_server.py +74 -66
  68. nat/data_models/authentication.py +23 -9
  69. nat/data_models/common.py +1 -1
  70. nat/data_models/component.py +2 -0
  71. nat/data_models/component_ref.py +11 -0
  72. nat/data_models/config.py +41 -17
  73. nat/data_models/dataset_handler.py +1 -1
  74. nat/data_models/discovery_metadata.py +4 -4
  75. nat/data_models/evaluate.py +4 -1
  76. nat/data_models/function.py +34 -0
  77. nat/data_models/function_dependencies.py +14 -6
  78. nat/data_models/gated_field_mixin.py +242 -0
  79. nat/data_models/intermediate_step.py +3 -3
  80. nat/data_models/optimizable.py +119 -0
  81. nat/data_models/optimizer.py +149 -0
  82. nat/data_models/span.py +41 -3
  83. nat/data_models/swe_bench_model.py +1 -1
  84. nat/data_models/temperature_mixin.py +44 -0
  85. nat/data_models/thinking_mixin.py +86 -0
  86. nat/data_models/top_p_mixin.py +44 -0
  87. nat/embedder/nim_embedder.py +1 -1
  88. nat/embedder/openai_embedder.py +1 -1
  89. nat/embedder/register.py +0 -1
  90. nat/eval/config.py +3 -1
  91. nat/eval/dataset_handler/dataset_handler.py +71 -7
  92. nat/eval/evaluate.py +86 -31
  93. nat/eval/evaluator/base_evaluator.py +1 -1
  94. nat/eval/evaluator/evaluator_model.py +13 -0
  95. nat/eval/intermediate_step_adapter.py +1 -1
  96. nat/eval/rag_evaluator/evaluate.py +2 -2
  97. nat/eval/rag_evaluator/register.py +3 -3
  98. nat/eval/register.py +4 -1
  99. nat/eval/remote_workflow.py +3 -3
  100. nat/eval/runtime_evaluator/__init__.py +14 -0
  101. nat/eval/runtime_evaluator/evaluate.py +123 -0
  102. nat/eval/runtime_evaluator/register.py +100 -0
  103. nat/eval/swe_bench_evaluator/evaluate.py +6 -6
  104. nat/eval/trajectory_evaluator/evaluate.py +1 -1
  105. nat/eval/trajectory_evaluator/register.py +1 -1
  106. nat/eval/tunable_rag_evaluator/evaluate.py +4 -7
  107. nat/eval/utils/eval_trace_ctx.py +89 -0
  108. nat/eval/utils/weave_eval.py +18 -9
  109. nat/experimental/decorators/experimental_warning_decorator.py +27 -7
  110. nat/experimental/test_time_compute/functions/plan_select_execute_function.py +7 -3
  111. nat/experimental/test_time_compute/functions/ttc_tool_orchestration_function.py +3 -3
  112. nat/experimental/test_time_compute/functions/ttc_tool_wrapper_function.py +1 -1
  113. nat/experimental/test_time_compute/models/strategy_base.py +5 -4
  114. nat/experimental/test_time_compute/register.py +0 -1
  115. nat/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +1 -3
  116. nat/front_ends/console/authentication_flow_handler.py +82 -30
  117. nat/front_ends/console/console_front_end_plugin.py +8 -5
  118. nat/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +52 -17
  119. nat/front_ends/fastapi/dask_client_mixin.py +65 -0
  120. nat/front_ends/fastapi/fastapi_front_end_config.py +36 -5
  121. nat/front_ends/fastapi/fastapi_front_end_controller.py +4 -4
  122. nat/front_ends/fastapi/fastapi_front_end_plugin.py +135 -4
  123. nat/front_ends/fastapi/fastapi_front_end_plugin_worker.py +452 -282
  124. nat/front_ends/fastapi/job_store.py +518 -99
  125. nat/front_ends/fastapi/main.py +11 -19
  126. nat/front_ends/fastapi/message_handler.py +13 -14
  127. nat/front_ends/fastapi/message_validator.py +19 -19
  128. nat/front_ends/fastapi/response_helpers.py +4 -4
  129. nat/front_ends/fastapi/step_adaptor.py +2 -2
  130. nat/front_ends/fastapi/utils.py +57 -0
  131. nat/front_ends/mcp/introspection_token_verifier.py +73 -0
  132. nat/front_ends/mcp/mcp_front_end_config.py +10 -1
  133. nat/front_ends/mcp/mcp_front_end_plugin.py +45 -13
  134. nat/front_ends/mcp/mcp_front_end_plugin_worker.py +116 -8
  135. nat/front_ends/mcp/tool_converter.py +44 -14
  136. nat/front_ends/register.py +0 -1
  137. nat/front_ends/simple_base/simple_front_end_plugin_base.py +3 -1
  138. nat/llm/aws_bedrock_llm.py +24 -12
  139. nat/llm/azure_openai_llm.py +13 -6
  140. nat/llm/litellm_llm.py +69 -0
  141. nat/llm/nim_llm.py +20 -8
  142. nat/llm/openai_llm.py +14 -6
  143. nat/llm/register.py +4 -1
  144. nat/llm/utils/env_config_value.py +2 -3
  145. nat/llm/utils/thinking.py +215 -0
  146. nat/meta/pypi.md +9 -9
  147. nat/object_store/register.py +0 -1
  148. nat/observability/exporter/base_exporter.py +3 -3
  149. nat/observability/exporter/file_exporter.py +1 -1
  150. nat/observability/exporter/processing_exporter.py +309 -81
  151. nat/observability/exporter/span_exporter.py +35 -15
  152. nat/observability/exporter_manager.py +7 -7
  153. nat/observability/mixin/file_mixin.py +7 -7
  154. nat/observability/mixin/redaction_config_mixin.py +42 -0
  155. nat/observability/mixin/tagging_config_mixin.py +62 -0
  156. nat/observability/mixin/type_introspection_mixin.py +420 -107
  157. nat/observability/processor/batching_processor.py +5 -7
  158. nat/observability/processor/falsy_batch_filter_processor.py +55 -0
  159. nat/observability/processor/processor.py +3 -0
  160. nat/observability/processor/processor_factory.py +70 -0
  161. nat/observability/processor/redaction/__init__.py +24 -0
  162. nat/observability/processor/redaction/contextual_redaction_processor.py +125 -0
  163. nat/observability/processor/redaction/contextual_span_redaction_processor.py +66 -0
  164. nat/observability/processor/redaction/redaction_processor.py +177 -0
  165. nat/observability/processor/redaction/span_header_redaction_processor.py +92 -0
  166. nat/observability/processor/span_tagging_processor.py +68 -0
  167. nat/observability/register.py +6 -4
  168. nat/profiler/calc/calc_runner.py +3 -4
  169. nat/profiler/callbacks/agno_callback_handler.py +1 -1
  170. nat/profiler/callbacks/langchain_callback_handler.py +6 -6
  171. nat/profiler/callbacks/llama_index_callback_handler.py +3 -3
  172. nat/profiler/callbacks/semantic_kernel_callback_handler.py +3 -3
  173. nat/profiler/data_frame_row.py +1 -1
  174. nat/profiler/decorators/framework_wrapper.py +62 -13
  175. nat/profiler/decorators/function_tracking.py +160 -3
  176. nat/profiler/forecasting/models/forecasting_base_model.py +3 -1
  177. nat/profiler/forecasting/models/linear_model.py +1 -1
  178. nat/profiler/forecasting/models/random_forest_regressor.py +1 -1
  179. nat/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +1 -1
  180. nat/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +1 -1
  181. nat/profiler/inference_optimization/data_models.py +3 -3
  182. nat/profiler/inference_optimization/experimental/prefix_span_analysis.py +8 -9
  183. nat/profiler/inference_optimization/token_uniqueness.py +1 -1
  184. nat/profiler/parameter_optimization/__init__.py +0 -0
  185. nat/profiler/parameter_optimization/optimizable_utils.py +93 -0
  186. nat/profiler/parameter_optimization/optimizer_runtime.py +67 -0
  187. nat/profiler/parameter_optimization/parameter_optimizer.py +153 -0
  188. nat/profiler/parameter_optimization/parameter_selection.py +107 -0
  189. nat/profiler/parameter_optimization/pareto_visualizer.py +380 -0
  190. nat/profiler/parameter_optimization/prompt_optimizer.py +384 -0
  191. nat/profiler/parameter_optimization/update_helpers.py +66 -0
  192. nat/profiler/profile_runner.py +14 -9
  193. nat/profiler/utils.py +4 -2
  194. nat/registry_handlers/local/local_handler.py +2 -2
  195. nat/registry_handlers/package_utils.py +1 -2
  196. nat/registry_handlers/pypi/pypi_handler.py +23 -26
  197. nat/registry_handlers/register.py +3 -4
  198. nat/registry_handlers/rest/rest_handler.py +12 -13
  199. nat/retriever/milvus/retriever.py +2 -2
  200. nat/retriever/nemo_retriever/retriever.py +1 -1
  201. nat/retriever/register.py +0 -1
  202. nat/runtime/loader.py +2 -2
  203. nat/runtime/runner.py +106 -8
  204. nat/runtime/session.py +69 -8
  205. nat/settings/global_settings.py +16 -5
  206. nat/tool/chat_completion.py +5 -2
  207. nat/tool/code_execution/local_sandbox/local_sandbox_server.py +3 -3
  208. nat/tool/datetime_tools.py +49 -9
  209. nat/tool/document_search.py +2 -2
  210. nat/tool/github_tools.py +450 -0
  211. nat/tool/memory_tools/get_memory_tool.py +1 -1
  212. nat/tool/nvidia_rag.py +1 -1
  213. nat/tool/register.py +2 -9
  214. nat/tool/retriever.py +3 -2
  215. nat/utils/callable_utils.py +70 -0
  216. nat/utils/data_models/schema_validator.py +3 -3
  217. nat/utils/decorators.py +210 -0
  218. nat/utils/exception_handlers/automatic_retries.py +104 -51
  219. nat/utils/exception_handlers/schemas.py +1 -1
  220. nat/utils/io/yaml_tools.py +2 -2
  221. nat/utils/log_levels.py +25 -0
  222. nat/utils/reactive/base/observable_base.py +2 -2
  223. nat/utils/reactive/base/observer_base.py +1 -1
  224. nat/utils/reactive/observable.py +2 -2
  225. nat/utils/reactive/observer.py +4 -4
  226. nat/utils/reactive/subscription.py +1 -1
  227. nat/utils/settings/global_settings.py +6 -8
  228. nat/utils/type_converter.py +4 -3
  229. nat/utils/type_utils.py +9 -5
  230. {nvidia_nat-1.3.0.dev2.dist-info → nvidia_nat-1.3.0rc2.dist-info}/METADATA +42 -18
  231. {nvidia_nat-1.3.0.dev2.dist-info → nvidia_nat-1.3.0rc2.dist-info}/RECORD +238 -196
  232. {nvidia_nat-1.3.0.dev2.dist-info → nvidia_nat-1.3.0rc2.dist-info}/entry_points.txt +1 -0
  233. nat/cli/commands/info/list_mcp.py +0 -304
  234. nat/tool/github_tools/create_github_commit.py +0 -133
  235. nat/tool/github_tools/create_github_issue.py +0 -87
  236. nat/tool/github_tools/create_github_pr.py +0 -106
  237. nat/tool/github_tools/get_github_file.py +0 -106
  238. nat/tool/github_tools/get_github_issue.py +0 -166
  239. nat/tool/github_tools/get_github_pr.py +0 -256
  240. nat/tool/github_tools/update_github_issue.py +0 -100
  241. nat/tool/mcp/exceptions.py +0 -142
  242. nat/tool/mcp/mcp_client.py +0 -255
  243. nat/tool/mcp/mcp_tool.py +0 -96
  244. nat/utils/exception_handlers/mcp.py +0 -211
  245. /nat/{tool/github_tools → agent/prompt_optimizer}/__init__.py +0 -0
  246. /nat/{tool/mcp → authentication/credential_validator}/__init__.py +0 -0
  247. {nvidia_nat-1.3.0.dev2.dist-info → nvidia_nat-1.3.0rc2.dist-info}/WHEEL +0 -0
  248. {nvidia_nat-1.3.0.dev2.dist-info → nvidia_nat-1.3.0rc2.dist-info}/licenses/LICENSE-3rd-party.txt +0 -0
  249. {nvidia_nat-1.3.0.dev2.dist-info → nvidia_nat-1.3.0rc2.dist-info}/licenses/LICENSE.md +0 -0
  250. {nvidia_nat-1.3.0.dev2.dist-info → nvidia_nat-1.3.0rc2.dist-info}/top_level.txt +0 -0
nat/profiler/parameter_optimization/prompt_optimizer.py ADDED
@@ -0,0 +1,384 @@
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+ # SPDX-License-Identifier: Apache-2.0
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+
+ import asyncio
+ import json
+ import logging
+ import random
+ from collections.abc import Sequence
+ from dataclasses import dataclass
+ from typing import Any
+
+ from pydantic import BaseModel
+
+ from nat.builder.workflow_builder import WorkflowBuilder
+ from nat.data_models.config import Config
+ from nat.data_models.optimizable import SearchSpace
+ from nat.data_models.optimizer import OptimizerConfig
+ from nat.data_models.optimizer import OptimizerRunConfig
+ from nat.eval.evaluate import EvaluationRun
+ from nat.eval.evaluate import EvaluationRunConfig
+ from nat.experimental.decorators.experimental_warning_decorator import experimental
+ from nat.profiler.parameter_optimization.update_helpers import apply_suggestions
+
+ logger = logging.getLogger(__name__)
+
+
+ class PromptOptimizerInputSchema(BaseModel):
+     original_prompt: str
+     objective: str
+     oracle_feedback: str | None = None
+
+
+ @experimental(feature_name="Optimizer")
+ async def optimize_prompts(
+     *,
+     base_cfg: Config,
+     full_space: dict[str, SearchSpace],
+     optimizer_config: OptimizerConfig,
+     opt_run_config: OptimizerRunConfig,
+ ) -> None:
+
+     # ------------- helpers ------------- #
+     @dataclass
+     class Individual:
+         prompts: dict[str, str]  # param_name -> prompt text
+         metrics: dict[str, float] | None = None  # evaluator_name -> average score
+         scalar_fitness: float | None = None
+
+     def _normalize_generation(
+         individuals: Sequence[Individual],
+         metric_names: Sequence[str],
+         directions: Sequence[str],
+         eps: float = 1e-12,
+     ) -> list[dict[str, float]]:
+         """Return per-individual dict of normalised scores in [0,1] where higher is better."""
+         # Extract arrays per metric
+         arrays = {m: [ind.metrics.get(m, 0.0) if ind.metrics else 0.0 for ind in individuals] for m in metric_names}
+         normed: list[dict[str, float]] = []
+         for i in range(len(individuals)):
+             entry: dict[str, float] = {}
+             for m, dirn in zip(metric_names, directions):
+                 vals = arrays[m]
+                 vmin = min(vals)
+                 vmax = max(vals)
+                 v = vals[i]
+                 # Map to [0,1] with higher=better regardless of direction
+                 if vmax - vmin < eps:
+                     score01 = 0.5
+                 else:
+                     score01 = (v - vmin) / (vmax - vmin)
+                 if dirn == "minimize":
+                     score01 = 1.0 - score01
+                 entry[m] = float(score01)
+             normed.append(entry)
+         return normed
+
+     def _scalarize(norm_scores: dict[str, float], *, mode: str, weights: Sequence[float] | None) -> float:
+         """Collapse normalised scores to a single scalar (higher is better)."""
+         vals = list(norm_scores.values())
+         if not vals:
+             return 0.0
+         if mode == "harmonic":
+             inv_sum = sum(1.0 / max(v, 1e-12) for v in vals)
+             return len(vals) / max(inv_sum, 1e-12)
+         if mode == "sum":
+             if weights is None:
+                 return float(sum(vals))
+             if len(weights) != len(vals):
+                 raise ValueError("weights length must equal number of objectives")
+             return float(sum(w * v for w, v in zip(weights, vals)))
+         if mode == "chebyshev":
+             return float(min(vals))  # maximise the worst-case score
+         raise ValueError(f"Unknown combination mode: {mode}")
+
+     def _apply_diversity_penalty(individuals: Sequence[Individual], diversity_lambda: float) -> list[float]:
+         if diversity_lambda <= 0.0:
+             return [0.0 for _ in individuals]
+         seen: dict[str, int] = {}
+         keys: list[str] = []
+         penalties: list[float] = []
+         for ind in individuals:
+             key = "\u241f".join(ind.prompts.get(k, "") for k in sorted(ind.prompts.keys()))
+             keys.append(key)
+             seen[key] = seen.get(key, 0) + 1
+         for key in keys:
+             duplicates = seen[key] - 1
+             penalties.append(diversity_lambda * float(duplicates))
+         return penalties
+
+     def _tournament_select(pop: Sequence[Individual], k: int) -> Individual:
+         contenders = random.sample(pop, k=min(k, len(pop)))
+         return max(contenders, key=lambda i: (i.scalar_fitness or 0.0))
+
+     # ------------- discover space ------------- #
+     prompt_space: dict[str, tuple[str, str]] = {
+         k: (v.prompt, v.prompt_purpose)
+         for k, v in full_space.items() if v.is_prompt
+     }
+
+     if not prompt_space:
+         logger.info("No prompts to optimize – skipping.")
+         return
+
+     metric_cfg = optimizer_config.eval_metrics
+     if metric_cfg is None or len(metric_cfg) == 0:
+         raise ValueError("optimizer_config.eval_metrics must be provided for GA prompt optimization")
+
+     directions = [v.direction for v in metric_cfg.values()]  # "minimize" or "maximize"
+     eval_metrics = [v.evaluator_name for v in metric_cfg.values()]
+     weights = [v.weight for v in metric_cfg.values()]
+
+     out_dir = optimizer_config.output_path
+     out_dir.mkdir(parents=True, exist_ok=True)
+
+     # ------------- builder & functions ------------- #
+     async with WorkflowBuilder(general_config=base_cfg.general, registry=None) as builder:
+         await builder.populate_builder(base_cfg)
+         init_fn_name = (optimizer_config.prompt.prompt_population_init_function)
+         if not init_fn_name:
+             raise ValueError(
+                 "No prompt optimization function configured. Set optimizer.prompt_population_init_function")
+         init_fn = await builder.get_function(init_fn_name)
+
+         recombine_fn = None
+         if optimizer_config.prompt.prompt_recombination_function:
+             recombine_fn = await builder.get_function(optimizer_config.prompt.prompt_recombination_function)
+
+         logger.info(
+             "GA Prompt optimization ready: init_fn=%s, recombine_fn=%s",
+             init_fn_name,
+             optimizer_config.prompt.prompt_recombination_function,
+         )
+
+         # ------------- GA parameters ------------- #
+         pop_size = max(2, int(optimizer_config.prompt.ga_population_size))
+         generations = max(1, int(optimizer_config.prompt.ga_generations))
+         offspring_size = (optimizer_config.prompt.ga_offspring_size
+                           or max(0, pop_size - optimizer_config.prompt.ga_elitism))
+         crossover_rate = float(optimizer_config.prompt.ga_crossover_rate)
+         mutation_rate = float(optimizer_config.prompt.ga_mutation_rate)
+         elitism = max(0, int(optimizer_config.prompt.ga_elitism))
+         selection_method = optimizer_config.prompt.ga_selection_method.lower()
+         tournament_size = max(2, int(optimizer_config.prompt.ga_tournament_size))
+         max_eval_concurrency = max(1, int(optimizer_config.prompt.ga_parallel_evaluations))
+         diversity_lambda = float(optimizer_config.prompt.ga_diversity_lambda)
+
+         # ------------- population init ------------- #
+         async def _mutate_prompt(original_prompt: str, purpose: str) -> str:
+             # Use LLM-based optimizer with no feedback
+             return await init_fn.acall_invoke(
+                 PromptOptimizerInputSchema(
+                     original_prompt=original_prompt,
+                     objective=purpose,
+                     oracle_feedback=None,
+                 ))
+
+         async def _recombine_prompts(a: str, b: str, purpose: str) -> str:
+             if recombine_fn is None:
+                 # Fallback: uniform choice per recombination
+                 return random.choice([a, b])
+             payload = {"original_prompt": a, "objective": purpose, "oracle_feedback": None, "parent_b": b}
+             return await recombine_fn.acall_invoke(payload)
+
+         def _make_individual_from_prompts(prompts: dict[str, str]) -> Individual:
+             return Individual(prompts=dict(prompts))
+
+         async def _initial_population() -> list[Individual]:
+             individuals: list[Individual] = []
+             # Ensure first individual is the original prompts
+             originals = {k: prompt_space[k][0] for k in prompt_space}
+             individuals.append(_make_individual_from_prompts(originals))
+
+             init_sem = asyncio.Semaphore(max_eval_concurrency)
+
+             async def _create_random_individual() -> Individual:
+                 async with init_sem:
+                     mutated: dict[str, str] = {}
+                     for param, (base_prompt, purpose) in prompt_space.items():
+                         try:
+                             new_p = await _mutate_prompt(base_prompt, purpose)
+                         except Exception as e:
+                             logger.warning("Mutation failed for %s: %s; using original.", param, e)
+                             new_p = base_prompt
+                         mutated[param] = new_p
+                     return _make_individual_from_prompts(mutated)
+
+             needed = max(0, pop_size - 1)
+             tasks = [_create_random_individual() for _ in range(needed)]
+             individuals.extend(await asyncio.gather(*tasks))
+             return individuals
+
+         # ------------- evaluation ------------- #
+         reps = max(1, getattr(optimizer_config, "reps_per_param_set", 1))
+
+         sem = asyncio.Semaphore(max_eval_concurrency)
+
+         async def _evaluate(ind: Individual) -> Individual:
+             async with sem:
+                 cfg_trial = apply_suggestions(base_cfg, ind.prompts)
+                 eval_cfg = EvaluationRunConfig(
+                     config_file=cfg_trial,
+                     dataset=opt_run_config.dataset,
+                     result_json_path=opt_run_config.result_json_path,
+                     endpoint=opt_run_config.endpoint,
+                     endpoint_timeout=opt_run_config.endpoint_timeout,
+                     override=opt_run_config.override,
+                 )
+                 # Run reps sequentially under the same semaphore to avoid overload
+                 all_results: list[list[tuple[str, Any]]] = []
+                 for _ in range(reps):
+                     res = (await EvaluationRun(config=eval_cfg).run_and_evaluate()).evaluation_results
+                     all_results.append(res)
+
+                 metrics: dict[str, float] = {}
+                 for metric_name in eval_metrics:
+                     scores: list[float] = []
+                     for run_results in all_results:
+                         for name, result in run_results:
+                             if name == metric_name:
+                                 scores.append(result.average_score)
+                                 break
+                     metrics[metric_name] = float(sum(scores) / len(scores)) if scores else 0.0
+                 ind.metrics = metrics
+                 return ind
+
+         async def _evaluate_population(pop: list[Individual]) -> list[Individual]:
+             # Evaluate those missing metrics
+             unevaluated = [ind for ind in pop if not ind.metrics]
+             if unevaluated:
+                 evaluated = await asyncio.gather(*[_evaluate(ind) for ind in unevaluated])
+                 # in-place update
+                 for ind, ev in zip(unevaluated, evaluated):
+                     ind.metrics = ev.metrics
+             # Scalarize
+             norm_per_ind = _normalize_generation(pop, eval_metrics, directions)
+             penalties = _apply_diversity_penalty(pop, diversity_lambda)
+             for ind, norm_scores, penalty in zip(pop, norm_per_ind, penalties):
+                 ind.scalar_fitness = _scalarize(
+                     norm_scores, mode=optimizer_config.multi_objective_combination_mode, weights=weights) - penalty
+             return pop
+
+         # ------------- reproduction ops ------------- #
+         async def _make_child(parent_a: Individual, parent_b: Individual) -> Individual:
+             child_prompts: dict[str, str] = {}
+             for param, (base_prompt, purpose) in prompt_space.items():
+                 pa = parent_a.prompts.get(param, base_prompt)
+                 pb = parent_b.prompts.get(param, base_prompt)
+                 child = pa
+                 # crossover
+                 if random.random() < crossover_rate:
+                     try:
+                         child = await _recombine_prompts(pa, pb, purpose)
+                     except Exception as e:
+                         logger.warning("Recombination failed for %s: %s; falling back to parent.", param, e)
+                         child = random.choice([pa, pb])
+                 # mutation
+                 if random.random() < mutation_rate:
+                     try:
+                         child = await _mutate_prompt(child, purpose)
+                     except Exception as e:
+                         logger.warning("Mutation failed for %s: %s; keeping child as-is.", param, e)
+                 child_prompts[param] = child
+             return _make_individual_from_prompts(child_prompts)
+
+         # ------------- GA loop ------------- #
+         population = await _initial_population()
+         history_rows: list[dict[str, Any]] = []
+
+         for gen in range(1, generations + 1):
+             logger.info("[GA] Generation %d/%d: evaluating population of %d", gen, generations, len(population))
+             population = await _evaluate_population(population)
+
+             # Log and save checkpoint
+             best = max(population, key=lambda i: (i.scalar_fitness or 0.0))
+             checkpoint = {k: (best.prompts[k], prompt_space[k][1]) for k in prompt_space}
+             checkpoint_path = out_dir / f"optimized_prompts_gen{gen}.json"
+             with checkpoint_path.open("w") as fh:
+                 json.dump(checkpoint, fh, indent=2)
+             logger.info("[GA] Saved checkpoint: %s (fitness=%.4f)", checkpoint_path, best.scalar_fitness or 0.0)
+
+             # Append history
+             for idx, ind in enumerate(population):
+                 row = {
+                     "generation": gen,
+                     "index": idx,
+                     "scalar_fitness": ind.scalar_fitness,
+                 }
+                 if ind.metrics:
+                     row.update({f"metric::{m}": ind.metrics[m] for m in eval_metrics})
+                 history_rows.append(row)
+
+             # Next generation via elitism + reproduction
+             next_population: list[Individual] = []
+             if elitism > 0:
+                 elites = sorted(population, key=lambda i: (i.scalar_fitness or 0.0), reverse=True)[:elitism]
+                 next_population.extend([_make_individual_from_prompts(e.prompts) for e in elites])
+
+             def _select_parent(curr_pop: list[Individual]) -> Individual:
+                 if selection_method == "tournament":
+                     return _tournament_select(curr_pop, tournament_size)
+                 # roulette wheel
+                 total = sum(max(ind.scalar_fitness or 0.0, 0.0) for ind in curr_pop) or 1.0
+                 r = random.random() * total
+                 acc = 0.0
+                 for ind in curr_pop:
+                     acc += max(ind.scalar_fitness or 0.0, 0.0)
+                     if acc >= r:
+                         return ind
+                 return curr_pop[-1]
+
+             # Produce offspring
+             needed = pop_size - len(next_population)
+             offspring: list[Individual] = []
+             for _ in range(max(0, offspring_size), needed):
+                 pass  # no-op: offspring are produced by the while loop below
+             while len(offspring) < needed:
+                 p1 = _select_parent(population)
+                 p2 = _select_parent(population)
+                 if p2 is p1 and len(population) > 1:
+                     p2 = random.choice([ind for ind in population if ind is not p1])
+                 child = await _make_child(p1, p2)
+                 offspring.append(child)
+
+             population = next_population + offspring
+
+         # Final evaluation to ensure metrics present
+         population = await _evaluate_population(population)
+         best = max(population, key=lambda i: (i.scalar_fitness or 0.0))
+         best_prompts = {k: (best.prompts[k], prompt_space[k][1]) for k in prompt_space}
+
+         # Save final
+         final_prompts_path = out_dir / "optimized_prompts.json"
+         with final_prompts_path.open("w") as fh:
+             json.dump(best_prompts, fh, indent=2)
+
+         trials_df_path = out_dir / "ga_history_prompts.csv"
+         try:
+             # Write the CSV manually with the standard library (no pandas dependency)
+             import csv  # pylint: disable=import-outside-toplevel
+
+             fieldnames: list[str] = sorted({k for row in history_rows for k in row.keys()})
+             with trials_df_path.open("w", newline="") as f:
+                 writer = csv.DictWriter(f, fieldnames=fieldnames)
+                 writer.writeheader()
+                 for row in history_rows:
+                     writer.writerow(row)
+         except Exception as e:  # pragma: no cover - best effort
+             logger.warning("Failed to write GA history CSV: %s", e)
+
+         logger.info("Prompt GA optimization finished successfully!")
+         logger.info("Final prompts saved to: %s", final_prompts_path)
+         logger.info("History saved to: %s", trials_df_path)
nat/profiler/parameter_optimization/update_helpers.py ADDED
@@ -0,0 +1,66 @@
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+ # SPDX-License-Identifier: Apache-2.0
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+
+ from collections import defaultdict
+ from typing import Any
+
+ from pydantic import BaseModel
+
+
+ def _deep_merge_dict(target: dict[str, Any], updates: dict[str, Any]) -> None:
+     """In-place deep merge of nested dictionaries."""
+     for key, value in updates.items():
+         if key in target and isinstance(target[key], dict) and isinstance(value, dict):
+             _deep_merge_dict(target[key], value)
+         else:
+             target[key] = value
+
+
+ def nest_updates(flat: dict[str, Any]) -> dict[str, Any]:
+     """
+     Convert ``{'a.b.c': 1, 'd.x.y': 2}`` ➜
+     ``{'a': {'b': {'c': 1}}, 'd': {'x': {'y': 2}}}``.
+     Works even when the middle segment is a dict key.
+     """
+     root: dict[str, Any] = defaultdict(dict)
+
+     for dotted, value in flat.items():
+         head, *rest = dotted.split(".", 1)
+         if not rest:  # leaf
+             root[head] = value
+             continue
+
+         tail = rest[0]
+         child_updates = nest_updates({tail: value})
+         if isinstance(root[head], dict):
+             _deep_merge_dict(root[head], child_updates)
+         else:
+             root[head] = child_updates
+     return dict(root)
+
+
+ def apply_suggestions(cfg: BaseModel, flat: dict[str, Any]) -> BaseModel:
+     """
+     Return a **new** config where only the dotted-path keys in *flat*
+     have been modified. Preserves all unrelated siblings.
+     """
+     cfg_dict = cfg.model_dump(mode="python")
+     for dotted, value in flat.items():
+         keys = dotted.split(".")
+         cursor = cfg_dict
+         for key in keys[:-1]:
+             cursor = cursor.setdefault(key, {})
+         cursor[keys[-1]] = value
+     return cfg.__class__.model_validate(cfg_dict)
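A quick usage sketch for the two helpers above (`DemoConfig` and `LLMSettings` are hypothetical stand-ins, not models from the package):

from pydantic import BaseModel

class LLMSettings(BaseModel):
    model: str = "llama-3.1-8b-instruct"
    temperature: float = 0.7

class DemoConfig(BaseModel):
    llm: LLMSettings = LLMSettings()

cfg = DemoConfig()
# apply_suggestions round-trips through model_dump()/model_validate(),
# so the original config object is left untouched.
new_cfg = apply_suggestions(cfg, {"llm.temperature": 0.2})
assert cfg.llm.temperature == 0.7 and new_cfg.llm.temperature == 0.2

# nest_updates only reshapes a flat dotted-path dict into nested dicts.
assert nest_updates({"a.b.c": 1, "a.b.d": 2}) == {"a": {"b": {"c": 1, "d": 2}}}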
nat/profiler/profile_runner.py CHANGED
@@ -88,14 +88,19 @@ class ProfilerRunner:
          writes out combined requests JSON, then computes and saves additional metrics,
          and optionally fits a forecasting model.
          """
-         from nat.profiler.inference_optimization.bottleneck_analysis.nested_stack_analysis import \
-             multi_example_call_profiling
-         from nat.profiler.inference_optimization.bottleneck_analysis.simple_stack_analysis import \
-             profile_workflow_bottlenecks
-         from nat.profiler.inference_optimization.experimental.concurrency_spike_analysis import \
-             concurrency_spike_analysis
-         from nat.profiler.inference_optimization.experimental.prefix_span_analysis import \
-             prefixspan_subworkflow_with_text
+         # Yapf and ruff disagree on how to format long imports; disable yapf and go with ruff
+         from nat.profiler.inference_optimization.bottleneck_analysis.nested_stack_analysis import (
+             multi_example_call_profiling,
+         )  # yapf: disable
+         from nat.profiler.inference_optimization.bottleneck_analysis.simple_stack_analysis import (
+             profile_workflow_bottlenecks,
+         )  # yapf: disable
+         from nat.profiler.inference_optimization.experimental.concurrency_spike_analysis import (
+             concurrency_spike_analysis,
+         )  # yapf: disable
+         from nat.profiler.inference_optimization.experimental.prefix_span_analysis import (
+             prefixspan_subworkflow_with_text,
+         )  # yapf: disable
          from nat.profiler.inference_optimization.llm_metrics import LLMMetrics
          from nat.profiler.inference_optimization.prompt_caching import get_common_prefixes
          from nat.profiler.inference_optimization.token_uniqueness import compute_inter_query_token_uniqueness_by_llm
@@ -277,7 +282,7 @@ class ProfilerRunner:
              fitted_model = model_trainer.train(all_steps)
              logger.info("Fitted model for forecasting.")
          except Exception as e:
-             logger.exception("Fitting model failed. %s", e, exc_info=True)
+             logger.exception("Fitting model failed. %s", e)
              return ProfilerResults()

          if self.write_output:
nat/profiler/utils.py CHANGED
@@ -22,6 +22,7 @@ from typing import Any
  import pandas as pd

  from nat.builder.framework_enum import LLMFrameworkEnum
+ from nat.cli.type_registry import RegisteredFunctionGroupInfo
  from nat.cli.type_registry import RegisteredFunctionInfo
  from nat.data_models.intermediate_step import IntermediateStep
  from nat.profiler.data_frame_row import DataFrameRow
@@ -32,7 +33,8 @@ _FRAMEWORK_REGEX_MAP = {t: fr'\b{t._name_}\b' for t in LLMFrameworkEnum}
  logger = logging.getLogger(__name__)


- def detect_llm_frameworks_in_build_fn(registration: RegisteredFunctionInfo) -> list[LLMFrameworkEnum]:
+ def detect_llm_frameworks_in_build_fn(
+         registration: RegisteredFunctionInfo | RegisteredFunctionGroupInfo) -> list[LLMFrameworkEnum]:
      """
      Analyze a function's source (the build_fn) to see which LLM frameworks it uses. Also recurses
      into any additional Python functions that the build_fn calls while passing `builder`, so that
@@ -175,7 +177,7 @@ def create_standardized_dataframe(requests_data: list[list[IntermediateStep]]) -
                  event_type=step.event_type).model_dump(), )

          except Exception as e:
-             logger.exception("Error creating standardized DataFrame: %s", e, exc_info=True)
+             logger.exception("Error creating standardized DataFrame: %s", e)
              return pd.DataFrame()

      if not all_rows:
nat/registry_handlers/local/local_handler.py CHANGED
@@ -133,7 +133,7 @@ class LocalRegistryHandler(AbstractRegistryHandler):
              "message": msg,
              "action": ActionEnum.SEARCH
          })
-         logger.exception(validated_search_response.status.message, exc_info=True)
+         logger.exception(validated_search_response.status.message)

          yield validated_search_response

@@ -168,7 +168,7 @@ class LocalRegistryHandler(AbstractRegistryHandler):
          validated_remove_response = RemoveResponse(status={
              "status": StatusEnum.ERROR, "message": msg, "action": ActionEnum.REMOVE
          })  # type: ignore
-         logger.exception(validated_remove_response.status.message, exc_info=True)
+         logger.exception(validated_remove_response.status.message)

          yield validated_remove_response

nat/registry_handlers/package_utils.py CHANGED
@@ -29,7 +29,6 @@ from nat.registry_handlers.schemas.publish import Artifact
  from nat.runtime.loader import PluginTypes
  from nat.runtime.loader import discover_entrypoints

- # pylint: disable=redefined-outer-name
  logger = logging.getLogger(__name__)


@@ -397,7 +396,7 @@ def get_transitive_dependencies(distribution_names: list[str]) -> dict[str, set[
          except importlib.metadata.PackageNotFoundError:
              pass

-         logger.error("Distribution %s not found (tried common variations)", dist_name)
+         logger.error("Distribution %s not found (tried common variations)", dist_name, exc_info=True)
          result[dist_name] = set()

  return result
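The `exc_info=True` added here points the opposite way from the `logger.exception` cleanups in the hunks above, and both changes match stdlib behaviour: `logging.exception` attaches the active traceback automatically (passing `exc_info=True` to it is redundant), while `logging.error` only attaches one when asked, and only while an exception is being handled. A minimal illustration:

import logging

log = logging.getLogger("demo")

try:
    1 / 0
except ZeroDivisionError:
    log.exception("failed")             # traceback included automatically
    log.error("failed", exc_info=True)  # equivalent output
    log.error("failed")                 # message only, no traceback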
nat/registry_handlers/pypi/pypi_handler.py CHANGED
@@ -44,13 +44,12 @@ class PypiRegistryHandler(AbstractRegistryHandler):
      https://github.com/pypiserver/pypiserver
      """

-     def __init__(  # pylint: disable=R0917
-             self,
-             endpoint: str,
-             token: str | None = None,
-             publish_route: str = "",
-             pull_route: str = "",
-             search_route: str = ""):
+     def __init__(self,
+                  endpoint: str,
+                  token: str | None = None,
+                  publish_route: str = "",
+                  pull_route: str = "",
+                  search_route: str = ""):
          super().__init__()
          self._endpoint = endpoint.rstrip("/")
          self._token = token
@@ -86,7 +85,7 @@ class PypiRegistryHandler(AbstractRegistryHandler):
          validated_publish_response = PublishResponse(status={
              "status": StatusEnum.ERROR, "message": msg, "action": ActionEnum.PUBLISH
          })
-         logger.exception(validated_publish_response.status.message, exc_info=True)
+         logger.exception(validated_publish_response.status.message)

          yield validated_publish_response

@@ -126,17 +125,16 @@ class PypiRegistryHandler(AbstractRegistryHandler):

          versioned_packages_str = " ".join(versioned_packages)

-         result = subprocess.run(
-             [
-                 "uv",
-                 "pip",
-                 "install",
-                 "--prerelease=allow",
-                 "--index-url",
-                 f"{self._endpoint}/{self._pull_route}/",
-                 versioned_packages_str
-             ],  # pylint: disable=W0631
-             check=True)
+         result = subprocess.run([
+             "uv",
+             "pip",
+             "install",
+             "--prerelease=allow",
+             "--index-url",
+             f"{self._endpoint}/{self._pull_route}/",
+             versioned_packages_str
+         ],
+                                 check=True)

          result.check_returncode()

@@ -151,7 +149,7 @@ class PypiRegistryHandler(AbstractRegistryHandler):
          validated_pull_response = PullResponse(status={
              "status": StatusEnum.ERROR, "message": msg, "action": ActionEnum.PULL
          })
-         logger.exception(validated_pull_response.status.message, exc_info=True)
+         logger.exception(validated_pull_response.status.message)

          yield validated_pull_response

@@ -171,11 +169,10 @@ class PypiRegistryHandler(AbstractRegistryHandler):
          """

          try:
-             completed_process = subprocess.run(
-                 ["pip", "search", "--index", f"{self._endpoint}", query.query],  # pylint: disable=W0631
-                 text=True,
-                 capture_output=True,
-                 check=True)
+             completed_process = subprocess.run(["pip", "search", "--index", f"{self._endpoint}", query.query],
+                                                text=True,
+                                                capture_output=True,
+                                                check=True)
              search_response_list = []
              search_results = completed_process.stdout
              package_results = search_results.split("\n")
@@ -215,7 +212,7 @@ class PypiRegistryHandler(AbstractRegistryHandler):

          except Exception as e:
              msg = f"Error searching for artifacts: {e}"
-             logger.exception(msg, exc_info=True)
+             logger.exception(msg)
              validated_search_response = SearchResponse(params=query,
                                                         status={
                                                             "status": StatusEnum.ERROR,
nat/registry_handlers/register.py CHANGED
@@ -13,9 +13,8 @@
  # See the License for the specific language governing permissions and
  # limitations under the License.

- # pylint: disable=unused-import
  # flake8: noqa

- from .local import register_local  # pylint: disable=E0611
- from .pypi import register_pypi  # pylint: disable=E0611
- from .rest import register_rest  # pylint: disable=E0611
+ from .local import register_local
+ from .pypi import register_pypi
+ from .rest import register_rest