nvidia-nat 1.2.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- aiq/__init__.py +66 -0
- nat/agent/__init__.py +0 -0
- nat/agent/base.py +256 -0
- nat/agent/dual_node.py +67 -0
- nat/agent/react_agent/__init__.py +0 -0
- nat/agent/react_agent/agent.py +363 -0
- nat/agent/react_agent/output_parser.py +104 -0
- nat/agent/react_agent/prompt.py +44 -0
- nat/agent/react_agent/register.py +149 -0
- nat/agent/reasoning_agent/__init__.py +0 -0
- nat/agent/reasoning_agent/reasoning_agent.py +225 -0
- nat/agent/register.py +23 -0
- nat/agent/rewoo_agent/__init__.py +0 -0
- nat/agent/rewoo_agent/agent.py +415 -0
- nat/agent/rewoo_agent/prompt.py +110 -0
- nat/agent/rewoo_agent/register.py +157 -0
- nat/agent/tool_calling_agent/__init__.py +0 -0
- nat/agent/tool_calling_agent/agent.py +119 -0
- nat/agent/tool_calling_agent/register.py +106 -0
- nat/authentication/__init__.py +14 -0
- nat/authentication/api_key/__init__.py +14 -0
- nat/authentication/api_key/api_key_auth_provider.py +96 -0
- nat/authentication/api_key/api_key_auth_provider_config.py +124 -0
- nat/authentication/api_key/register.py +26 -0
- nat/authentication/exceptions/__init__.py +14 -0
- nat/authentication/exceptions/api_key_exceptions.py +38 -0
- nat/authentication/http_basic_auth/__init__.py +0 -0
- nat/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
- nat/authentication/http_basic_auth/register.py +30 -0
- nat/authentication/interfaces.py +93 -0
- nat/authentication/oauth2/__init__.py +14 -0
- nat/authentication/oauth2/oauth2_auth_code_flow_provider.py +107 -0
- nat/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
- nat/authentication/oauth2/register.py +25 -0
- nat/authentication/register.py +21 -0
- nat/builder/__init__.py +0 -0
- nat/builder/builder.py +285 -0
- nat/builder/component_utils.py +316 -0
- nat/builder/context.py +270 -0
- nat/builder/embedder.py +24 -0
- nat/builder/eval_builder.py +161 -0
- nat/builder/evaluator.py +29 -0
- nat/builder/framework_enum.py +24 -0
- nat/builder/front_end.py +73 -0
- nat/builder/function.py +344 -0
- nat/builder/function_base.py +380 -0
- nat/builder/function_info.py +627 -0
- nat/builder/intermediate_step_manager.py +174 -0
- nat/builder/llm.py +25 -0
- nat/builder/retriever.py +25 -0
- nat/builder/user_interaction_manager.py +78 -0
- nat/builder/workflow.py +148 -0
- nat/builder/workflow_builder.py +1117 -0
- nat/cli/__init__.py +14 -0
- nat/cli/cli_utils/__init__.py +0 -0
- nat/cli/cli_utils/config_override.py +231 -0
- nat/cli/cli_utils/validation.py +37 -0
- nat/cli/commands/__init__.py +0 -0
- nat/cli/commands/configure/__init__.py +0 -0
- nat/cli/commands/configure/channel/__init__.py +0 -0
- nat/cli/commands/configure/channel/add.py +28 -0
- nat/cli/commands/configure/channel/channel.py +34 -0
- nat/cli/commands/configure/channel/remove.py +30 -0
- nat/cli/commands/configure/channel/update.py +30 -0
- nat/cli/commands/configure/configure.py +33 -0
- nat/cli/commands/evaluate.py +139 -0
- nat/cli/commands/info/__init__.py +14 -0
- nat/cli/commands/info/info.py +37 -0
- nat/cli/commands/info/list_channels.py +32 -0
- nat/cli/commands/info/list_components.py +129 -0
- nat/cli/commands/info/list_mcp.py +304 -0
- nat/cli/commands/registry/__init__.py +14 -0
- nat/cli/commands/registry/publish.py +88 -0
- nat/cli/commands/registry/pull.py +118 -0
- nat/cli/commands/registry/registry.py +36 -0
- nat/cli/commands/registry/remove.py +108 -0
- nat/cli/commands/registry/search.py +155 -0
- nat/cli/commands/sizing/__init__.py +14 -0
- nat/cli/commands/sizing/calc.py +297 -0
- nat/cli/commands/sizing/sizing.py +27 -0
- nat/cli/commands/start.py +246 -0
- nat/cli/commands/uninstall.py +81 -0
- nat/cli/commands/validate.py +47 -0
- nat/cli/commands/workflow/__init__.py +14 -0
- nat/cli/commands/workflow/templates/__init__.py.j2 +0 -0
- nat/cli/commands/workflow/templates/config.yml.j2 +16 -0
- nat/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
- nat/cli/commands/workflow/templates/register.py.j2 +5 -0
- nat/cli/commands/workflow/templates/workflow.py.j2 +36 -0
- nat/cli/commands/workflow/workflow.py +37 -0
- nat/cli/commands/workflow/workflow_commands.py +317 -0
- nat/cli/entrypoint.py +135 -0
- nat/cli/main.py +57 -0
- nat/cli/register_workflow.py +488 -0
- nat/cli/type_registry.py +1000 -0
- nat/data_models/__init__.py +14 -0
- nat/data_models/api_server.py +716 -0
- nat/data_models/authentication.py +231 -0
- nat/data_models/common.py +171 -0
- nat/data_models/component.py +58 -0
- nat/data_models/component_ref.py +168 -0
- nat/data_models/config.py +410 -0
- nat/data_models/dataset_handler.py +169 -0
- nat/data_models/discovery_metadata.py +305 -0
- nat/data_models/embedder.py +27 -0
- nat/data_models/evaluate.py +127 -0
- nat/data_models/evaluator.py +26 -0
- nat/data_models/front_end.py +26 -0
- nat/data_models/function.py +30 -0
- nat/data_models/function_dependencies.py +72 -0
- nat/data_models/interactive.py +246 -0
- nat/data_models/intermediate_step.py +302 -0
- nat/data_models/invocation_node.py +38 -0
- nat/data_models/llm.py +27 -0
- nat/data_models/logging.py +26 -0
- nat/data_models/memory.py +27 -0
- nat/data_models/object_store.py +44 -0
- nat/data_models/profiler.py +54 -0
- nat/data_models/registry_handler.py +26 -0
- nat/data_models/retriever.py +30 -0
- nat/data_models/retry_mixin.py +35 -0
- nat/data_models/span.py +190 -0
- nat/data_models/step_adaptor.py +64 -0
- nat/data_models/streaming.py +33 -0
- nat/data_models/swe_bench_model.py +54 -0
- nat/data_models/telemetry_exporter.py +26 -0
- nat/data_models/ttc_strategy.py +30 -0
- nat/embedder/__init__.py +0 -0
- nat/embedder/nim_embedder.py +59 -0
- nat/embedder/openai_embedder.py +43 -0
- nat/embedder/register.py +22 -0
- nat/eval/__init__.py +14 -0
- nat/eval/config.py +60 -0
- nat/eval/dataset_handler/__init__.py +0 -0
- nat/eval/dataset_handler/dataset_downloader.py +106 -0
- nat/eval/dataset_handler/dataset_filter.py +52 -0
- nat/eval/dataset_handler/dataset_handler.py +367 -0
- nat/eval/evaluate.py +510 -0
- nat/eval/evaluator/__init__.py +14 -0
- nat/eval/evaluator/base_evaluator.py +77 -0
- nat/eval/evaluator/evaluator_model.py +45 -0
- nat/eval/intermediate_step_adapter.py +99 -0
- nat/eval/rag_evaluator/__init__.py +0 -0
- nat/eval/rag_evaluator/evaluate.py +178 -0
- nat/eval/rag_evaluator/register.py +143 -0
- nat/eval/register.py +23 -0
- nat/eval/remote_workflow.py +133 -0
- nat/eval/runners/__init__.py +14 -0
- nat/eval/runners/config.py +39 -0
- nat/eval/runners/multi_eval_runner.py +54 -0
- nat/eval/runtime_event_subscriber.py +52 -0
- nat/eval/swe_bench_evaluator/__init__.py +0 -0
- nat/eval/swe_bench_evaluator/evaluate.py +215 -0
- nat/eval/swe_bench_evaluator/register.py +36 -0
- nat/eval/trajectory_evaluator/__init__.py +0 -0
- nat/eval/trajectory_evaluator/evaluate.py +75 -0
- nat/eval/trajectory_evaluator/register.py +40 -0
- nat/eval/tunable_rag_evaluator/__init__.py +0 -0
- nat/eval/tunable_rag_evaluator/evaluate.py +245 -0
- nat/eval/tunable_rag_evaluator/register.py +52 -0
- nat/eval/usage_stats.py +41 -0
- nat/eval/utils/__init__.py +0 -0
- nat/eval/utils/output_uploader.py +140 -0
- nat/eval/utils/tqdm_position_registry.py +40 -0
- nat/eval/utils/weave_eval.py +184 -0
- nat/experimental/__init__.py +0 -0
- nat/experimental/decorators/__init__.py +0 -0
- nat/experimental/decorators/experimental_warning_decorator.py +134 -0
- nat/experimental/test_time_compute/__init__.py +0 -0
- nat/experimental/test_time_compute/editing/__init__.py +0 -0
- nat/experimental/test_time_compute/editing/iterative_plan_refinement_editor.py +147 -0
- nat/experimental/test_time_compute/editing/llm_as_a_judge_editor.py +204 -0
- nat/experimental/test_time_compute/editing/motivation_aware_summarization.py +107 -0
- nat/experimental/test_time_compute/functions/__init__.py +0 -0
- nat/experimental/test_time_compute/functions/execute_score_select_function.py +105 -0
- nat/experimental/test_time_compute/functions/plan_select_execute_function.py +224 -0
- nat/experimental/test_time_compute/functions/ttc_tool_orchestration_function.py +205 -0
- nat/experimental/test_time_compute/functions/ttc_tool_wrapper_function.py +146 -0
- nat/experimental/test_time_compute/models/__init__.py +0 -0
- nat/experimental/test_time_compute/models/editor_config.py +132 -0
- nat/experimental/test_time_compute/models/scoring_config.py +112 -0
- nat/experimental/test_time_compute/models/search_config.py +120 -0
- nat/experimental/test_time_compute/models/selection_config.py +154 -0
- nat/experimental/test_time_compute/models/stage_enums.py +43 -0
- nat/experimental/test_time_compute/models/strategy_base.py +66 -0
- nat/experimental/test_time_compute/models/tool_use_config.py +41 -0
- nat/experimental/test_time_compute/models/ttc_item.py +48 -0
- nat/experimental/test_time_compute/register.py +36 -0
- nat/experimental/test_time_compute/scoring/__init__.py +0 -0
- nat/experimental/test_time_compute/scoring/llm_based_agent_scorer.py +168 -0
- nat/experimental/test_time_compute/scoring/llm_based_plan_scorer.py +168 -0
- nat/experimental/test_time_compute/scoring/motivation_aware_scorer.py +111 -0
- nat/experimental/test_time_compute/search/__init__.py +0 -0
- nat/experimental/test_time_compute/search/multi_llm_planner.py +128 -0
- nat/experimental/test_time_compute/search/multi_query_retrieval_search.py +122 -0
- nat/experimental/test_time_compute/search/single_shot_multi_plan_planner.py +128 -0
- nat/experimental/test_time_compute/selection/__init__.py +0 -0
- nat/experimental/test_time_compute/selection/best_of_n_selector.py +63 -0
- nat/experimental/test_time_compute/selection/llm_based_agent_output_selector.py +131 -0
- nat/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +159 -0
- nat/experimental/test_time_compute/selection/llm_based_plan_selector.py +128 -0
- nat/experimental/test_time_compute/selection/threshold_selector.py +58 -0
- nat/front_ends/__init__.py +14 -0
- nat/front_ends/console/__init__.py +14 -0
- nat/front_ends/console/authentication_flow_handler.py +233 -0
- nat/front_ends/console/console_front_end_config.py +32 -0
- nat/front_ends/console/console_front_end_plugin.py +96 -0
- nat/front_ends/console/register.py +25 -0
- nat/front_ends/cron/__init__.py +14 -0
- nat/front_ends/fastapi/__init__.py +14 -0
- nat/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
- nat/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
- nat/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +107 -0
- nat/front_ends/fastapi/fastapi_front_end_config.py +241 -0
- nat/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
- nat/front_ends/fastapi/fastapi_front_end_plugin.py +116 -0
- nat/front_ends/fastapi/fastapi_front_end_plugin_worker.py +1087 -0
- nat/front_ends/fastapi/html_snippets/__init__.py +14 -0
- nat/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
- nat/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
- nat/front_ends/fastapi/job_store.py +183 -0
- nat/front_ends/fastapi/main.py +72 -0
- nat/front_ends/fastapi/message_handler.py +320 -0
- nat/front_ends/fastapi/message_validator.py +352 -0
- nat/front_ends/fastapi/register.py +25 -0
- nat/front_ends/fastapi/response_helpers.py +195 -0
- nat/front_ends/fastapi/step_adaptor.py +319 -0
- nat/front_ends/mcp/__init__.py +14 -0
- nat/front_ends/mcp/mcp_front_end_config.py +36 -0
- nat/front_ends/mcp/mcp_front_end_plugin.py +81 -0
- nat/front_ends/mcp/mcp_front_end_plugin_worker.py +143 -0
- nat/front_ends/mcp/register.py +27 -0
- nat/front_ends/mcp/tool_converter.py +241 -0
- nat/front_ends/register.py +22 -0
- nat/front_ends/simple_base/__init__.py +14 -0
- nat/front_ends/simple_base/simple_front_end_plugin_base.py +54 -0
- nat/llm/__init__.py +0 -0
- nat/llm/aws_bedrock_llm.py +57 -0
- nat/llm/nim_llm.py +46 -0
- nat/llm/openai_llm.py +46 -0
- nat/llm/register.py +23 -0
- nat/llm/utils/__init__.py +14 -0
- nat/llm/utils/env_config_value.py +94 -0
- nat/llm/utils/error.py +17 -0
- nat/memory/__init__.py +20 -0
- nat/memory/interfaces.py +183 -0
- nat/memory/models.py +112 -0
- nat/meta/pypi.md +58 -0
- nat/object_store/__init__.py +20 -0
- nat/object_store/in_memory_object_store.py +76 -0
- nat/object_store/interfaces.py +84 -0
- nat/object_store/models.py +38 -0
- nat/object_store/register.py +20 -0
- nat/observability/__init__.py +14 -0
- nat/observability/exporter/__init__.py +14 -0
- nat/observability/exporter/base_exporter.py +449 -0
- nat/observability/exporter/exporter.py +78 -0
- nat/observability/exporter/file_exporter.py +33 -0
- nat/observability/exporter/processing_exporter.py +322 -0
- nat/observability/exporter/raw_exporter.py +52 -0
- nat/observability/exporter/span_exporter.py +288 -0
- nat/observability/exporter_manager.py +335 -0
- nat/observability/mixin/__init__.py +14 -0
- nat/observability/mixin/batch_config_mixin.py +26 -0
- nat/observability/mixin/collector_config_mixin.py +23 -0
- nat/observability/mixin/file_mixin.py +288 -0
- nat/observability/mixin/file_mode.py +23 -0
- nat/observability/mixin/resource_conflict_mixin.py +134 -0
- nat/observability/mixin/serialize_mixin.py +61 -0
- nat/observability/mixin/type_introspection_mixin.py +183 -0
- nat/observability/processor/__init__.py +14 -0
- nat/observability/processor/batching_processor.py +310 -0
- nat/observability/processor/callback_processor.py +42 -0
- nat/observability/processor/intermediate_step_serializer.py +28 -0
- nat/observability/processor/processor.py +71 -0
- nat/observability/register.py +96 -0
- nat/observability/utils/__init__.py +14 -0
- nat/observability/utils/dict_utils.py +236 -0
- nat/observability/utils/time_utils.py +31 -0
- nat/plugins/.namespace +1 -0
- nat/profiler/__init__.py +0 -0
- nat/profiler/calc/__init__.py +14 -0
- nat/profiler/calc/calc_runner.py +627 -0
- nat/profiler/calc/calculations.py +288 -0
- nat/profiler/calc/data_models.py +188 -0
- nat/profiler/calc/plot.py +345 -0
- nat/profiler/callbacks/__init__.py +0 -0
- nat/profiler/callbacks/agno_callback_handler.py +295 -0
- nat/profiler/callbacks/base_callback_class.py +20 -0
- nat/profiler/callbacks/langchain_callback_handler.py +290 -0
- nat/profiler/callbacks/llama_index_callback_handler.py +205 -0
- nat/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
- nat/profiler/callbacks/token_usage_base_model.py +27 -0
- nat/profiler/data_frame_row.py +51 -0
- nat/profiler/data_models.py +24 -0
- nat/profiler/decorators/__init__.py +0 -0
- nat/profiler/decorators/framework_wrapper.py +131 -0
- nat/profiler/decorators/function_tracking.py +254 -0
- nat/profiler/forecasting/__init__.py +0 -0
- nat/profiler/forecasting/config.py +18 -0
- nat/profiler/forecasting/model_trainer.py +75 -0
- nat/profiler/forecasting/models/__init__.py +22 -0
- nat/profiler/forecasting/models/forecasting_base_model.py +40 -0
- nat/profiler/forecasting/models/linear_model.py +197 -0
- nat/profiler/forecasting/models/random_forest_regressor.py +269 -0
- nat/profiler/inference_metrics_model.py +28 -0
- nat/profiler/inference_optimization/__init__.py +0 -0
- nat/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
- nat/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +460 -0
- nat/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
- nat/profiler/inference_optimization/data_models.py +386 -0
- nat/profiler/inference_optimization/experimental/__init__.py +0 -0
- nat/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
- nat/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
- nat/profiler/inference_optimization/llm_metrics.py +212 -0
- nat/profiler/inference_optimization/prompt_caching.py +163 -0
- nat/profiler/inference_optimization/token_uniqueness.py +107 -0
- nat/profiler/inference_optimization/workflow_runtimes.py +72 -0
- nat/profiler/intermediate_property_adapter.py +102 -0
- nat/profiler/profile_runner.py +473 -0
- nat/profiler/utils.py +184 -0
- nat/registry_handlers/__init__.py +0 -0
- nat/registry_handlers/local/__init__.py +0 -0
- nat/registry_handlers/local/local_handler.py +176 -0
- nat/registry_handlers/local/register_local.py +37 -0
- nat/registry_handlers/metadata_factory.py +60 -0
- nat/registry_handlers/package_utils.py +571 -0
- nat/registry_handlers/pypi/__init__.py +0 -0
- nat/registry_handlers/pypi/pypi_handler.py +251 -0
- nat/registry_handlers/pypi/register_pypi.py +40 -0
- nat/registry_handlers/register.py +21 -0
- nat/registry_handlers/registry_handler_base.py +157 -0
- nat/registry_handlers/rest/__init__.py +0 -0
- nat/registry_handlers/rest/register_rest.py +56 -0
- nat/registry_handlers/rest/rest_handler.py +237 -0
- nat/registry_handlers/schemas/__init__.py +0 -0
- nat/registry_handlers/schemas/headers.py +42 -0
- nat/registry_handlers/schemas/package.py +68 -0
- nat/registry_handlers/schemas/publish.py +68 -0
- nat/registry_handlers/schemas/pull.py +82 -0
- nat/registry_handlers/schemas/remove.py +36 -0
- nat/registry_handlers/schemas/search.py +91 -0
- nat/registry_handlers/schemas/status.py +47 -0
- nat/retriever/__init__.py +0 -0
- nat/retriever/interface.py +41 -0
- nat/retriever/milvus/__init__.py +14 -0
- nat/retriever/milvus/register.py +81 -0
- nat/retriever/milvus/retriever.py +228 -0
- nat/retriever/models.py +77 -0
- nat/retriever/nemo_retriever/__init__.py +14 -0
- nat/retriever/nemo_retriever/register.py +60 -0
- nat/retriever/nemo_retriever/retriever.py +190 -0
- nat/retriever/register.py +22 -0
- nat/runtime/__init__.py +14 -0
- nat/runtime/loader.py +220 -0
- nat/runtime/runner.py +195 -0
- nat/runtime/session.py +162 -0
- nat/runtime/user_metadata.py +130 -0
- nat/settings/__init__.py +0 -0
- nat/settings/global_settings.py +318 -0
- nat/test/.namespace +1 -0
- nat/tool/__init__.py +0 -0
- nat/tool/chat_completion.py +74 -0
- nat/tool/code_execution/README.md +151 -0
- nat/tool/code_execution/__init__.py +0 -0
- nat/tool/code_execution/code_sandbox.py +267 -0
- nat/tool/code_execution/local_sandbox/.gitignore +1 -0
- nat/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
- nat/tool/code_execution/local_sandbox/__init__.py +13 -0
- nat/tool/code_execution/local_sandbox/local_sandbox_server.py +198 -0
- nat/tool/code_execution/local_sandbox/sandbox.requirements.txt +6 -0
- nat/tool/code_execution/local_sandbox/start_local_sandbox.sh +50 -0
- nat/tool/code_execution/register.py +74 -0
- nat/tool/code_execution/test_code_execution_sandbox.py +414 -0
- nat/tool/code_execution/utils.py +100 -0
- nat/tool/datetime_tools.py +42 -0
- nat/tool/document_search.py +141 -0
- nat/tool/github_tools/__init__.py +0 -0
- nat/tool/github_tools/create_github_commit.py +133 -0
- nat/tool/github_tools/create_github_issue.py +87 -0
- nat/tool/github_tools/create_github_pr.py +106 -0
- nat/tool/github_tools/get_github_file.py +106 -0
- nat/tool/github_tools/get_github_issue.py +166 -0
- nat/tool/github_tools/get_github_pr.py +256 -0
- nat/tool/github_tools/update_github_issue.py +100 -0
- nat/tool/mcp/__init__.py +14 -0
- nat/tool/mcp/exceptions.py +142 -0
- nat/tool/mcp/mcp_client.py +255 -0
- nat/tool/mcp/mcp_tool.py +96 -0
- nat/tool/memory_tools/__init__.py +0 -0
- nat/tool/memory_tools/add_memory_tool.py +79 -0
- nat/tool/memory_tools/delete_memory_tool.py +67 -0
- nat/tool/memory_tools/get_memory_tool.py +72 -0
- nat/tool/nvidia_rag.py +95 -0
- nat/tool/register.py +38 -0
- nat/tool/retriever.py +94 -0
- nat/tool/server_tools.py +66 -0
- nat/utils/__init__.py +0 -0
- nat/utils/data_models/__init__.py +0 -0
- nat/utils/data_models/schema_validator.py +58 -0
- nat/utils/debugging_utils.py +43 -0
- nat/utils/dump_distro_mapping.py +32 -0
- nat/utils/exception_handlers/__init__.py +0 -0
- nat/utils/exception_handlers/automatic_retries.py +289 -0
- nat/utils/exception_handlers/mcp.py +211 -0
- nat/utils/exception_handlers/schemas.py +114 -0
- nat/utils/io/__init__.py +0 -0
- nat/utils/io/model_processing.py +28 -0
- nat/utils/io/yaml_tools.py +119 -0
- nat/utils/log_utils.py +37 -0
- nat/utils/metadata_utils.py +74 -0
- nat/utils/optional_imports.py +142 -0
- nat/utils/producer_consumer_queue.py +178 -0
- nat/utils/reactive/__init__.py +0 -0
- nat/utils/reactive/base/__init__.py +0 -0
- nat/utils/reactive/base/observable_base.py +65 -0
- nat/utils/reactive/base/observer_base.py +55 -0
- nat/utils/reactive/base/subject_base.py +79 -0
- nat/utils/reactive/observable.py +59 -0
- nat/utils/reactive/observer.py +76 -0
- nat/utils/reactive/subject.py +131 -0
- nat/utils/reactive/subscription.py +49 -0
- nat/utils/settings/__init__.py +0 -0
- nat/utils/settings/global_settings.py +197 -0
- nat/utils/string_utils.py +38 -0
- nat/utils/type_converter.py +290 -0
- nat/utils/type_utils.py +484 -0
- nat/utils/url_utils.py +27 -0
- nvidia_nat-1.2.0.dist-info/METADATA +365 -0
- nvidia_nat-1.2.0.dist-info/RECORD +435 -0
- nvidia_nat-1.2.0.dist-info/WHEEL +5 -0
- nvidia_nat-1.2.0.dist-info/entry_points.txt +21 -0
- nvidia_nat-1.2.0.dist-info/licenses/LICENSE-3rd-party.txt +5478 -0
- nvidia_nat-1.2.0.dist-info/licenses/LICENSE.md +201 -0
- nvidia_nat-1.2.0.dist-info/top_level.txt +2 -0
|
@@ -0,0 +1,111 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import asyncio
|
|
17
|
+
import logging
|
|
18
|
+
import re
|
|
19
|
+
|
|
20
|
+
from nat.builder.builder import Builder
|
|
21
|
+
from nat.builder.framework_enum import LLMFrameworkEnum
|
|
22
|
+
from nat.cli.register_workflow import register_ttc_strategy
|
|
23
|
+
from nat.data_models.ttc_strategy import TTCStrategyBaseConfig
|
|
24
|
+
from nat.experimental.test_time_compute.models.scoring_config import MotivationAwareScoringConfig
|
|
25
|
+
from nat.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
26
|
+
from nat.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
27
|
+
from nat.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
28
|
+
from nat.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
29
|
+
from nat.utils.io.model_processing import remove_r1_think_tags
|
|
30
|
+
|
|
31
|
+
logger = logging.getLogger(__name__)
|
|
32
|
+
|
|
33
|
+
|
|
34
|
+
class MotivationAwareScorer(StrategyBase):
    """
    A strategy that scores a TTCItem's output based on how well it
    addresses both the original input (task) and the 'motivation' from metadata.

    The scoring LLM is prompted with ``config.scoring_template`` and its reply is
    searched for a ``FINAL SCORE: <number>`` marker.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        super().__init__(config)
        # Set by build_components(); ainvoke() rejects anything that is not a BaseChatModel.
        self.llm_bound = None

    async def build_components(self, builder: Builder) -> None:
        """
        Resolve ``config.scoring_llm`` through the builder using the LangChain wrapper.
        """
        self.llm_bound = await builder.get_llm(self.config.scoring_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """
        Return the pipeline types this strategy supports (TOOL_USE only).
        """
        return [PipelineTypeEnum.TOOL_USE]

    def stage_type(self) -> StageTypeEnum:
        """
        Return the stage this strategy implements (SCORING).
        """
        return StageTypeEnum.SCORING

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Scores each item by combining the original 'task_description' and 'motivation' with the 'output'.
        The resulting score is stored in item.score.

        Args:
            items: Items to score. Each item's ``input``, ``metadata`` and ``output`` are rendered
                into the scoring template; the items are updated in place.
            original_prompt: Not used by this strategy.
            agent_context: Not used by this strategy.
            **kwargs: Not used by this strategy.

        Returns:
            The same ``items`` list, with ``score`` set on every item. An item whose response
            contains no parsable ``FINAL SCORE:`` value receives ``0.0``.

        Raises:
            ValueError: If the bound scoring LLM is not a ``BaseChatModel``.
        """
        from langchain_core.language_models import BaseChatModel
        from langchain_core.prompts import PromptTemplate

        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("scoring_llm must be a BaseChatModel instance for MotivationAwareScorer.")

        scoring_model: BaseChatModel = self.llm_bound

        scoring_template = PromptTemplate(template=self.config.scoring_template,
                                          input_variables=["task", "motivation", "output"],
                                          validate_template=True)

        def as_text(value) -> str:
            # str(None) is the truthy string "None", so `str(value) or ""` would never
            # fall back to "" and the literal "None" would be sent to the scoring LLM.
            return "" if value is None else str(value)

        async def score_item(item: TTCItem) -> float:
            task_str = as_text(item.input)
            motivation_str = str(item.metadata) if item.metadata else ""
            output_str = as_text(item.output)

            prompt = (await scoring_template.ainvoke({
                "task": task_str, "motivation": motivation_str, "output": output_str
            })).to_string()

            response = (await scoring_model.ainvoke(prompt)).content
            response = remove_r1_think_tags(response or "")

            match = re.search(r'FINAL SCORE:\s*([\d.]+)', response)
            if not match:
                logger.warning("Could not parse score from response: %s", response)
                return 0.0

            score_str = match.group(1)
            try:
                return float(score_str)
            except ValueError:
                # The pattern also accepts strings such as "1.2.3" or "." that are not valid floats.
                logger.warning("Could not convert score '%s' to float.", score_str)
                return 0.0

        # asyncio.gather returns results in the order the awaitables were passed,
        # so scores line up with items.
        scores = await asyncio.gather(*(score_item(item) for item in items))

        for item, score in zip(items, scores):
            item.score = score

        return items
|
|
105
|
+
|
|
106
|
+
|
|
107
|
+
@register_ttc_strategy(config_type=MotivationAwareScoringConfig)
async def register_motivation_aware_scorer(config: MotivationAwareScoringConfig, builder: Builder):
    """
    Create a MotivationAwareScorer from ``config``, build its components with ``builder``,
    and yield the ready-to-use strategy.
    """
    strategy = MotivationAwareScorer(config)
    await strategy.build_components(builder)
    yield strategy
|
|
File without changes
|
|
@@ -0,0 +1,128 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import asyncio
|
|
17
|
+
import logging
|
|
18
|
+
import re
|
|
19
|
+
|
|
20
|
+
from nat.builder.builder import Builder
|
|
21
|
+
from nat.builder.framework_enum import LLMFrameworkEnum
|
|
22
|
+
from nat.cli.register_workflow import register_ttc_strategy
|
|
23
|
+
from nat.experimental.test_time_compute.models.search_config import MultiLLMPlanConfig
|
|
24
|
+
from nat.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
25
|
+
from nat.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
26
|
+
from nat.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
27
|
+
from nat.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
28
|
+
from nat.utils.io.model_processing import remove_r1_think_tags
|
|
29
|
+
|
|
30
|
+
logger = logging.getLogger(__name__)
|
|
31
|
+
|
|
32
|
+
|
|
33
|
+
class MultiLLMPlanner(StrategyBase):
    """
    A planner that uses multiple LLMs to generate plans. Each LLM can generate
    a specified number of plans, and all plans are combined.
    """

    def __init__(self, config: MultiLLMPlanConfig) -> None:
        super().__init__(config)
        self.config = config
        self.llms_bound = []  # Will hold the "bound" LLMs after build_components

    async def build_components(self, builder: Builder) -> None:
        """
        Build the components required for this multi-LLM planner.
        Binds each LLMRef from the config with the selected framework wrapper (LANGCHAIN).
        """
        logger.debug("Building components for MultiLLMPlanner")
        self.llms_bound = []
        for llm_ref in self.config.llms:
            bound_llm = await builder.get_llm(llm_ref, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
            self.llms_bound.append(bound_llm)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """
        Return the pipeline types this strategy supports (PLANNING only).
        """
        return [PipelineTypeEnum.PLANNING]

    def stage_type(self) -> StageTypeEnum:
        """
        Return the stage this strategy implements (SEARCH).
        """
        return StageTypeEnum.SEARCH

    async def _generate_plan_for_temperature(self, llm, base_prompt: str, temperature: float) -> TTCItem:
        """
        Invoke ``llm`` once at the given temperature and wrap the cleaned response in a TTCItem.

        Think tags and a leading "PLAN:" marker are stripped from the response. If nothing
        remains, a TTCItem carrying a placeholder plan string is returned.
        """
        bound_llm = llm.bind(temperature=temperature)
        response = await bound_llm.ainvoke(base_prompt)
        cleaned = remove_r1_think_tags(response.content if hasattr(response, 'content') else str(response))
        # The plan is expected to start with "PLAN:" and all the text after it is the plan
        cleaned = re.sub(r'(?i)^\s*PLAN:\s*', '', cleaned).strip()

        if not cleaned:
            logger.warning("No plan generated for the prompt: %s.", base_prompt)
            # Return an item with a placeholder plan to avoid breaking the generation loop
            return TTCItem(plan="Plan was not generated")

        return TTCItem(plan=cleaned)

    async def _generate_plans_for_llm(self, llm, base_prompt: str) -> list[TTCItem]:
        """
        Generate ``config.plans_per_llm`` plans from one LLM, concurrently.

        Temperatures are spaced evenly from ``config.min_temperature`` to
        ``config.max_temperature`` inclusive; a single plan uses ``min_temperature``.
        """
        plan_count = self.config.plans_per_llm
        low = self.config.min_temperature
        if plan_count == 1:
            # Handled separately: the interpolation below would divide by zero.
            temps = [low]
        else:
            span = self.config.max_temperature - low
            temps = [low + (i / (plan_count - 1)) * span for i in range(plan_count)]
        tasks = [self._generate_plan_for_temperature(llm, base_prompt, temp) for temp in temps]
        return await asyncio.gather(*tasks)

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Generate a list of TTCItems by querying each LLM in self.llms_bound.
        Each LLM produces 'plans_per_llm' plans.

        Args:
            items: Not used by this strategy; plans are generated from the prompt alone.
            original_prompt: Rendered into the planning template as ``prompt``.
            agent_context: Rendered into the planning template as ``context``.
            **kwargs: Not used by this strategy.

        Returns:
            A flat list with the plans from every bound LLM.

        Raises:
            ImportError: If ``langchain_core`` cannot be imported.
        """
        try:
            from langchain_core.prompts import PromptTemplate
        except ImportError as exc:
            # Chain the original error so the underlying import failure stays visible.
            raise ImportError("langchain-core is not installed. Please install it to use MultiLLMPlanner.\n"
                              "This error can be resolve by installing nvidia-nat-langchain.") from exc

        # Create a single PromptTemplate
        planning_template = PromptTemplate(template=self.config.planning_template,
                                           input_variables=["context", "prompt"],
                                           validate_template=True)

        # Format the prompt once
        base_prompt = (await planning_template.ainvoke({
            "context": agent_context, "prompt": original_prompt
        })).to_string()

        # Launch generation for each llm concurrently using the helper method
        tasks = [self._generate_plans_for_llm(llm, base_prompt) for llm in self.llms_bound]
        results_nested = await asyncio.gather(*tasks)

        # Flatten the nested lists of TTCItem
        all_plans: list[TTCItem] = [p for sub in results_nested for p in sub]
        logger.info("MultiLLMPlanner generated %d plans total.", len(all_plans))
        return all_plans
|
|
119
|
+
|
|
120
|
+
|
|
121
|
+
@register_ttc_strategy(config_type=MultiLLMPlanConfig)
async def register_multi_llm_planner(config: MultiLLMPlanConfig, builder: Builder):
    """
    Build a MultiLLMPlanner from ``config``, bind its components through ``builder``, and yield it.
    """
    strategy = MultiLLMPlanner(config)
    # Components must be built before the strategy is handed out
    await strategy.build_components(builder)
    yield strategy
|
|
@@ -0,0 +1,122 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
|
|
18
|
+
from nat.builder.builder import Builder
|
|
19
|
+
from nat.builder.framework_enum import LLMFrameworkEnum
|
|
20
|
+
from nat.cli.register_workflow import register_ttc_strategy
|
|
21
|
+
from nat.experimental.test_time_compute.models.search_config import MultiQueryRetrievalSearchConfig
|
|
22
|
+
from nat.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
23
|
+
from nat.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
24
|
+
from nat.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
25
|
+
from nat.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
26
|
+
from nat.utils.io.model_processing import remove_r1_think_tags
|
|
27
|
+
|
|
28
|
+
logger = logging.getLogger(__name__)
|
|
29
|
+
|
|
30
|
+
|
|
31
|
+
class MultiQueryRetrievalSearch(StrategyBase):
    """
    A strategy that, for each incoming TTCItem, generates multiple new items by
    re-writing the item's input from different perspectives.
    Uses multiple LLMs to encourage diversity.
    """

    def __init__(self, config: MultiQueryRetrievalSearchConfig) -> None:
        super().__init__(config)
        self.config = config
        # Populated by build_components()
        self.llms_bound = []

    async def build_components(self, builder: Builder) -> None:
        """
        Binds each LLMRef in self.config.llms to an actual LLM client.
        """
        self.llms_bound = []
        for llm_ref in self.config.llms:
            bound_llm = await builder.get_llm(llm_ref, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
            self.llms_bound.append(bound_llm)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types this strategy supports (tool use only)."""
        return [PipelineTypeEnum.TOOL_USE]

    def stage_type(self) -> StageTypeEnum:
        """Return the stage this strategy occupies (search)."""
        return StageTypeEnum.SEARCH

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        For each TTCItem, rewrite the 'input' using each LLM to create a new perspective.

        The returned list contains, for every incoming item, one pass-through copy whose
        'output' equals the original input, followed by one new TTCItem per bound LLM whose
        'output' stores the newly generated query. ``original_prompt``, ``agent_context`` and
        ``kwargs`` are not read by this method.

        Raises:
            ImportError: If ``langchain_core`` cannot be imported.
        """
        try:
            from langchain_core.prompts import PromptTemplate
        except ImportError:
            raise ImportError("langchain-core is required for MultiQueryRetrievalSearch. "
                              "Install nvidia-nat-langchain or similar.")

        new_ttc_items: list[TTCItem] = []

        # Create a single PromptTemplate object for rewriting the query
        template_vars = ["task", "motivation"]
        query_template = PromptTemplate(template=self.config.query_generation_template,
                                        input_variables=template_vars,
                                        validate_template=True)

        for item in items:
            # str(None) is the truthy string "None", so a missing input has to be checked
            # explicitly; otherwise the literal text "None" would be sent to the LLMs.
            original_task = "" if item.input is None else str(item.input)
            motivation = str(item.metadata) if item.metadata else ""

            # Keep the original query as a candidate alongside the rewrites
            new_ttc_items.append(
                TTCItem(
                    input=item.input,
                    output=item.input,
                    metadata=item.metadata,
                    name=item.name,  # keep the original tool name
                ))

            if not self.llms_bound:
                continue

            # The prompt depends only on the item, so render it once rather than once per LLM
            prompt_str = (await query_template.ainvoke({
                "task": original_task, "motivation": motivation
            })).to_string()

            for llm in self.llms_bound:
                # We'll call each LLM to produce a new query
                response = await llm.ainvoke(prompt_str)
                cleaned = remove_r1_think_tags(response.content if hasattr(response, 'content') else str(response))
                cleaned = cleaned.strip()

                # Create a new TTCItem for each newly generated query
                new_item = TTCItem(
                    input=item.input,  # keep the original input for reference
                    output=cleaned,  # store the newly generated query in the output
                    metadata=item.metadata,
                    name=item.name,  # same tool name or optional new name
                )
                new_ttc_items.append(new_item)

        logger.info("MultiQueryRetrievalSearch produced %d new items from %d original items.",
                    len(new_ttc_items),
                    len(items))

        return new_ttc_items
|
|
116
|
+
|
|
117
|
+
|
|
118
|
+
@register_ttc_strategy(config_type=MultiQueryRetrievalSearchConfig)
async def register_multi_query_retrieval_search(config: MultiQueryRetrievalSearchConfig, builder: Builder):
    """
    Build a MultiQueryRetrievalSearch from ``config``, bind its LLMs through ``builder``, and yield it.
    """
    search = MultiQueryRetrievalSearch(config)
    # LLM clients must be bound before the strategy is handed out
    await search.build_components(builder)
    yield search
|
|
@@ -0,0 +1,128 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import asyncio
|
|
17
|
+
import logging
|
|
18
|
+
import re
|
|
19
|
+
|
|
20
|
+
from nat.builder.builder import Builder
|
|
21
|
+
from nat.builder.framework_enum import LLMFrameworkEnum
|
|
22
|
+
from nat.cli.register_workflow import register_ttc_strategy
|
|
23
|
+
from nat.data_models.ttc_strategy import TTCStrategyBaseConfig
|
|
24
|
+
from nat.experimental.test_time_compute.models.search_config import SingleShotMultiPlanConfig
|
|
25
|
+
from nat.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
26
|
+
from nat.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
27
|
+
from nat.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
28
|
+
from nat.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
29
|
+
from nat.utils.io.model_processing import remove_r1_think_tags
|
|
30
|
+
|
|
31
|
+
logger = logging.getLogger(__name__)
|
|
32
|
+
|
|
33
|
+
|
|
34
|
+
class SingleShotMultiPlanPlanner(StrategyBase):
    """
    Implementation of the Single Shot Multi Plan Planner.
    This planner generates multiple plans in a single shot.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        super().__init__(config)
        # Populated by build_components()
        self.llm_bound = None

    async def build_components(self, builder: Builder) -> None:
        """
        Bind ``self.config.planning_llm`` to a LangChain-wrapped LLM client.
        """
        self.llm_bound = await builder.get_llm(self.config.planning_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types this strategy supports (planning only)."""
        return [PipelineTypeEnum.PLANNING]

    def stage_type(self) -> StageTypeEnum:
        """Return the stage this strategy occupies (search)."""
        return StageTypeEnum.SEARCH

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Generate ``self.config.num_plans`` TTCItems based on the provided prompt.

        The planning prompt is rendered once from ``self.config.planning_template`` and sent
        to the bound LLM concurrently at temperatures spaced evenly between
        ``self.config.min_temperature`` and ``self.config.max_temperature``. ``items`` and
        ``kwargs`` are not read by this method.

        Raises:
            ImportError: If ``langchain_core`` cannot be imported.
            ValueError: If the bound LLM is not a ``BaseChatModel`` or no plans were generated.
        """

        try:
            from langchain_core.language_models import BaseChatModel
            from langchain_core.prompts import PromptTemplate
        except ImportError:
            raise ImportError("langchain-core is not installed. Please install it to use SingleShotMultiPlanPlanner.\n"
                              "This error can be resolve by installing nvidia-nat-langchain.")

        planning_template = PromptTemplate(template=self.config.planning_template,
                                           input_variables=["context", "prompt"],
                                           validate_template=True)
        prompt = (await planning_template.ainvoke(input={
            "context": agent_context, "prompt": original_prompt
        })).to_string()

        # Ensure the bound planning LLM is a BaseChatModel
        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("The `planning_llm` must be an instance of `BaseChatModel`.")

        model: BaseChatModel = self.llm_bound

        async def generate_plan(llm: BaseChatModel, plan_prompt: str, temperature: float) -> TTCItem:
            """
            Helper function to generate a plan using the provided prompt and temperature.
            """
            llm_bound = llm.bind(temperature=temperature)
            response = await llm_bound.ainvoke(plan_prompt)
            cleaned = remove_r1_think_tags(response.content if hasattr(response, 'content') else str(response))

            # Plan will be the string following 'PLAN:'. Use regex to strip the leading marker
            cleaned = re.sub(r'(?i)^\s*PLAN:\s*', '', cleaned).strip()

            if not cleaned:
                logger.warning("No plan generated for the prompt: %s.", plan_prompt)
                # Return a placeholder plan instead of failing, to avoid breaking the generation loop
                return TTCItem(plan="Plan was not generated")

            return TTCItem(plan=cleaned)

        # Define a list of temperatures based on min and max temperature in the config and number of plans to generate
        num_plans = self.config.num_plans
        if num_plans == 1:
            # A single plan has no range to interpolate over; interpolating would divide by zero
            temperatures = [self.config.min_temperature]
        else:
            temperatures = [
                self.config.min_temperature + (i / (num_plans - 1)) *
                (self.config.max_temperature - self.config.min_temperature) for i in range(num_plans)
            ]

        # Generate plans using the defined temperatures in parallel using asyncio
        tasks = [generate_plan(model, prompt, temperature) for temperature in temperatures]
        # Run the tasks concurrently and gather results
        plans = await asyncio.gather(*tasks)

        if not plans:
            raise ValueError("No plans were generated. Please check the LLM response.")

        logger.info("Generated %d plans from the SingleShotMultiPlanPlanner", self.config.num_plans)

        logger.debug("Generated plans: %s", [plan.dict() for plan in plans])

        return plans
|
|
119
|
+
|
|
120
|
+
|
|
121
|
+
@register_ttc_strategy(config_type=SingleShotMultiPlanConfig)
async def register_single_shot_multi_plan_planner(config: SingleShotMultiPlanConfig, builder: Builder):
    """
    Build a SingleShotMultiPlanPlanner from ``config``, bind its LLM through ``builder``, and yield it.
    """
    strategy = SingleShotMultiPlanPlanner(config)
    # The planning LLM must be bound before the strategy is handed out
    await strategy.build_components(builder)
    yield strategy
|
|
File without changes
|
|
@@ -0,0 +1,63 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
|
|
18
|
+
from nat.builder.builder import Builder
|
|
19
|
+
from nat.cli.register_workflow import register_ttc_strategy
|
|
20
|
+
from nat.experimental.test_time_compute.models.selection_config import BestOfNSelectionConfig
|
|
21
|
+
from nat.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
22
|
+
from nat.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
23
|
+
from nat.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
24
|
+
from nat.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
25
|
+
|
|
26
|
+
logger = logging.getLogger(__name__)
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
class BestOfNSelector(StrategyBase):
    """
    Selection strategy that keeps only the highest-scoring TTCItem.
    """

    async def build_components(self, builder: Builder) -> None:
        """No components are built for this strategy."""
        pass

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types this strategy supports (planning, agent execution and tool use)."""
        return [PipelineTypeEnum.PLANNING, PipelineTypeEnum.AGENT_EXECUTION, PipelineTypeEnum.TOOL_USE]

    def stage_type(self) -> StageTypeEnum:
        """Return the stage this strategy occupies (selection)."""
        return StageTypeEnum.SELECTION

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Return a single-element list holding the item with the highest ``score``.

        ``original_prompt``, ``agent_context`` and ``kwargs`` are not read by this method.

        Raises:
            ValueError: If ``items`` is empty, or if any item has a ``score`` of None.
        """

        # max() on an empty sequence raises an opaque ValueError; fail with a clear message instead
        if not items:
            raise ValueError("BestOfNSelector requires at least one item to select from.")

        # Assert that every planning item has a non NoneType score
        for item in items:
            if item.score is None:
                raise ValueError("Every planning item must have a score. Did you use a scorer before this?")

        # Pick the planning item with the highest score
        best_item = max(items, key=lambda x: x.score)

        return [best_item]
|
|
55
|
+
|
|
56
|
+
|
|
57
|
+
@register_ttc_strategy(config_type=BestOfNSelectionConfig)
async def register_best_of_n_selector(config: BestOfNSelectionConfig, builder: Builder):
    """
    Build a BestOfNSelector from ``config`` and yield it; ``builder`` is not used here.
    """
    yield BestOfNSelector(config)
|