nvidia-nat 1.2.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- aiq/__init__.py +66 -0
- nat/agent/__init__.py +0 -0
- nat/agent/base.py +256 -0
- nat/agent/dual_node.py +67 -0
- nat/agent/react_agent/__init__.py +0 -0
- nat/agent/react_agent/agent.py +363 -0
- nat/agent/react_agent/output_parser.py +104 -0
- nat/agent/react_agent/prompt.py +44 -0
- nat/agent/react_agent/register.py +149 -0
- nat/agent/reasoning_agent/__init__.py +0 -0
- nat/agent/reasoning_agent/reasoning_agent.py +225 -0
- nat/agent/register.py +23 -0
- nat/agent/rewoo_agent/__init__.py +0 -0
- nat/agent/rewoo_agent/agent.py +415 -0
- nat/agent/rewoo_agent/prompt.py +110 -0
- nat/agent/rewoo_agent/register.py +157 -0
- nat/agent/tool_calling_agent/__init__.py +0 -0
- nat/agent/tool_calling_agent/agent.py +119 -0
- nat/agent/tool_calling_agent/register.py +106 -0
- nat/authentication/__init__.py +14 -0
- nat/authentication/api_key/__init__.py +14 -0
- nat/authentication/api_key/api_key_auth_provider.py +96 -0
- nat/authentication/api_key/api_key_auth_provider_config.py +124 -0
- nat/authentication/api_key/register.py +26 -0
- nat/authentication/exceptions/__init__.py +14 -0
- nat/authentication/exceptions/api_key_exceptions.py +38 -0
- nat/authentication/http_basic_auth/__init__.py +0 -0
- nat/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
- nat/authentication/http_basic_auth/register.py +30 -0
- nat/authentication/interfaces.py +93 -0
- nat/authentication/oauth2/__init__.py +14 -0
- nat/authentication/oauth2/oauth2_auth_code_flow_provider.py +107 -0
- nat/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
- nat/authentication/oauth2/register.py +25 -0
- nat/authentication/register.py +21 -0
- nat/builder/__init__.py +0 -0
- nat/builder/builder.py +285 -0
- nat/builder/component_utils.py +316 -0
- nat/builder/context.py +270 -0
- nat/builder/embedder.py +24 -0
- nat/builder/eval_builder.py +161 -0
- nat/builder/evaluator.py +29 -0
- nat/builder/framework_enum.py +24 -0
- nat/builder/front_end.py +73 -0
- nat/builder/function.py +344 -0
- nat/builder/function_base.py +380 -0
- nat/builder/function_info.py +627 -0
- nat/builder/intermediate_step_manager.py +174 -0
- nat/builder/llm.py +25 -0
- nat/builder/retriever.py +25 -0
- nat/builder/user_interaction_manager.py +78 -0
- nat/builder/workflow.py +148 -0
- nat/builder/workflow_builder.py +1117 -0
- nat/cli/__init__.py +14 -0
- nat/cli/cli_utils/__init__.py +0 -0
- nat/cli/cli_utils/config_override.py +231 -0
- nat/cli/cli_utils/validation.py +37 -0
- nat/cli/commands/__init__.py +0 -0
- nat/cli/commands/configure/__init__.py +0 -0
- nat/cli/commands/configure/channel/__init__.py +0 -0
- nat/cli/commands/configure/channel/add.py +28 -0
- nat/cli/commands/configure/channel/channel.py +34 -0
- nat/cli/commands/configure/channel/remove.py +30 -0
- nat/cli/commands/configure/channel/update.py +30 -0
- nat/cli/commands/configure/configure.py +33 -0
- nat/cli/commands/evaluate.py +139 -0
- nat/cli/commands/info/__init__.py +14 -0
- nat/cli/commands/info/info.py +37 -0
- nat/cli/commands/info/list_channels.py +32 -0
- nat/cli/commands/info/list_components.py +129 -0
- nat/cli/commands/info/list_mcp.py +304 -0
- nat/cli/commands/registry/__init__.py +14 -0
- nat/cli/commands/registry/publish.py +88 -0
- nat/cli/commands/registry/pull.py +118 -0
- nat/cli/commands/registry/registry.py +36 -0
- nat/cli/commands/registry/remove.py +108 -0
- nat/cli/commands/registry/search.py +155 -0
- nat/cli/commands/sizing/__init__.py +14 -0
- nat/cli/commands/sizing/calc.py +297 -0
- nat/cli/commands/sizing/sizing.py +27 -0
- nat/cli/commands/start.py +246 -0
- nat/cli/commands/uninstall.py +81 -0
- nat/cli/commands/validate.py +47 -0
- nat/cli/commands/workflow/__init__.py +14 -0
- nat/cli/commands/workflow/templates/__init__.py.j2 +0 -0
- nat/cli/commands/workflow/templates/config.yml.j2 +16 -0
- nat/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
- nat/cli/commands/workflow/templates/register.py.j2 +5 -0
- nat/cli/commands/workflow/templates/workflow.py.j2 +36 -0
- nat/cli/commands/workflow/workflow.py +37 -0
- nat/cli/commands/workflow/workflow_commands.py +317 -0
- nat/cli/entrypoint.py +135 -0
- nat/cli/main.py +57 -0
- nat/cli/register_workflow.py +488 -0
- nat/cli/type_registry.py +1000 -0
- nat/data_models/__init__.py +14 -0
- nat/data_models/api_server.py +716 -0
- nat/data_models/authentication.py +231 -0
- nat/data_models/common.py +171 -0
- nat/data_models/component.py +58 -0
- nat/data_models/component_ref.py +168 -0
- nat/data_models/config.py +410 -0
- nat/data_models/dataset_handler.py +169 -0
- nat/data_models/discovery_metadata.py +305 -0
- nat/data_models/embedder.py +27 -0
- nat/data_models/evaluate.py +127 -0
- nat/data_models/evaluator.py +26 -0
- nat/data_models/front_end.py +26 -0
- nat/data_models/function.py +30 -0
- nat/data_models/function_dependencies.py +72 -0
- nat/data_models/interactive.py +246 -0
- nat/data_models/intermediate_step.py +302 -0
- nat/data_models/invocation_node.py +38 -0
- nat/data_models/llm.py +27 -0
- nat/data_models/logging.py +26 -0
- nat/data_models/memory.py +27 -0
- nat/data_models/object_store.py +44 -0
- nat/data_models/profiler.py +54 -0
- nat/data_models/registry_handler.py +26 -0
- nat/data_models/retriever.py +30 -0
- nat/data_models/retry_mixin.py +35 -0
- nat/data_models/span.py +190 -0
- nat/data_models/step_adaptor.py +64 -0
- nat/data_models/streaming.py +33 -0
- nat/data_models/swe_bench_model.py +54 -0
- nat/data_models/telemetry_exporter.py +26 -0
- nat/data_models/ttc_strategy.py +30 -0
- nat/embedder/__init__.py +0 -0
- nat/embedder/nim_embedder.py +59 -0
- nat/embedder/openai_embedder.py +43 -0
- nat/embedder/register.py +22 -0
- nat/eval/__init__.py +14 -0
- nat/eval/config.py +60 -0
- nat/eval/dataset_handler/__init__.py +0 -0
- nat/eval/dataset_handler/dataset_downloader.py +106 -0
- nat/eval/dataset_handler/dataset_filter.py +52 -0
- nat/eval/dataset_handler/dataset_handler.py +367 -0
- nat/eval/evaluate.py +510 -0
- nat/eval/evaluator/__init__.py +14 -0
- nat/eval/evaluator/base_evaluator.py +77 -0
- nat/eval/evaluator/evaluator_model.py +45 -0
- nat/eval/intermediate_step_adapter.py +99 -0
- nat/eval/rag_evaluator/__init__.py +0 -0
- nat/eval/rag_evaluator/evaluate.py +178 -0
- nat/eval/rag_evaluator/register.py +143 -0
- nat/eval/register.py +23 -0
- nat/eval/remote_workflow.py +133 -0
- nat/eval/runners/__init__.py +14 -0
- nat/eval/runners/config.py +39 -0
- nat/eval/runners/multi_eval_runner.py +54 -0
- nat/eval/runtime_event_subscriber.py +52 -0
- nat/eval/swe_bench_evaluator/__init__.py +0 -0
- nat/eval/swe_bench_evaluator/evaluate.py +215 -0
- nat/eval/swe_bench_evaluator/register.py +36 -0
- nat/eval/trajectory_evaluator/__init__.py +0 -0
- nat/eval/trajectory_evaluator/evaluate.py +75 -0
- nat/eval/trajectory_evaluator/register.py +40 -0
- nat/eval/tunable_rag_evaluator/__init__.py +0 -0
- nat/eval/tunable_rag_evaluator/evaluate.py +245 -0
- nat/eval/tunable_rag_evaluator/register.py +52 -0
- nat/eval/usage_stats.py +41 -0
- nat/eval/utils/__init__.py +0 -0
- nat/eval/utils/output_uploader.py +140 -0
- nat/eval/utils/tqdm_position_registry.py +40 -0
- nat/eval/utils/weave_eval.py +184 -0
- nat/experimental/__init__.py +0 -0
- nat/experimental/decorators/__init__.py +0 -0
- nat/experimental/decorators/experimental_warning_decorator.py +134 -0
- nat/experimental/test_time_compute/__init__.py +0 -0
- nat/experimental/test_time_compute/editing/__init__.py +0 -0
- nat/experimental/test_time_compute/editing/iterative_plan_refinement_editor.py +147 -0
- nat/experimental/test_time_compute/editing/llm_as_a_judge_editor.py +204 -0
- nat/experimental/test_time_compute/editing/motivation_aware_summarization.py +107 -0
- nat/experimental/test_time_compute/functions/__init__.py +0 -0
- nat/experimental/test_time_compute/functions/execute_score_select_function.py +105 -0
- nat/experimental/test_time_compute/functions/plan_select_execute_function.py +224 -0
- nat/experimental/test_time_compute/functions/ttc_tool_orchestration_function.py +205 -0
- nat/experimental/test_time_compute/functions/ttc_tool_wrapper_function.py +146 -0
- nat/experimental/test_time_compute/models/__init__.py +0 -0
- nat/experimental/test_time_compute/models/editor_config.py +132 -0
- nat/experimental/test_time_compute/models/scoring_config.py +112 -0
- nat/experimental/test_time_compute/models/search_config.py +120 -0
- nat/experimental/test_time_compute/models/selection_config.py +154 -0
- nat/experimental/test_time_compute/models/stage_enums.py +43 -0
- nat/experimental/test_time_compute/models/strategy_base.py +66 -0
- nat/experimental/test_time_compute/models/tool_use_config.py +41 -0
- nat/experimental/test_time_compute/models/ttc_item.py +48 -0
- nat/experimental/test_time_compute/register.py +36 -0
- nat/experimental/test_time_compute/scoring/__init__.py +0 -0
- nat/experimental/test_time_compute/scoring/llm_based_agent_scorer.py +168 -0
- nat/experimental/test_time_compute/scoring/llm_based_plan_scorer.py +168 -0
- nat/experimental/test_time_compute/scoring/motivation_aware_scorer.py +111 -0
- nat/experimental/test_time_compute/search/__init__.py +0 -0
- nat/experimental/test_time_compute/search/multi_llm_planner.py +128 -0
- nat/experimental/test_time_compute/search/multi_query_retrieval_search.py +122 -0
- nat/experimental/test_time_compute/search/single_shot_multi_plan_planner.py +128 -0
- nat/experimental/test_time_compute/selection/__init__.py +0 -0
- nat/experimental/test_time_compute/selection/best_of_n_selector.py +63 -0
- nat/experimental/test_time_compute/selection/llm_based_agent_output_selector.py +131 -0
- nat/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +159 -0
- nat/experimental/test_time_compute/selection/llm_based_plan_selector.py +128 -0
- nat/experimental/test_time_compute/selection/threshold_selector.py +58 -0
- nat/front_ends/__init__.py +14 -0
- nat/front_ends/console/__init__.py +14 -0
- nat/front_ends/console/authentication_flow_handler.py +233 -0
- nat/front_ends/console/console_front_end_config.py +32 -0
- nat/front_ends/console/console_front_end_plugin.py +96 -0
- nat/front_ends/console/register.py +25 -0
- nat/front_ends/cron/__init__.py +14 -0
- nat/front_ends/fastapi/__init__.py +14 -0
- nat/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
- nat/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
- nat/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +107 -0
- nat/front_ends/fastapi/fastapi_front_end_config.py +241 -0
- nat/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
- nat/front_ends/fastapi/fastapi_front_end_plugin.py +116 -0
- nat/front_ends/fastapi/fastapi_front_end_plugin_worker.py +1087 -0
- nat/front_ends/fastapi/html_snippets/__init__.py +14 -0
- nat/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
- nat/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
- nat/front_ends/fastapi/job_store.py +183 -0
- nat/front_ends/fastapi/main.py +72 -0
- nat/front_ends/fastapi/message_handler.py +320 -0
- nat/front_ends/fastapi/message_validator.py +352 -0
- nat/front_ends/fastapi/register.py +25 -0
- nat/front_ends/fastapi/response_helpers.py +195 -0
- nat/front_ends/fastapi/step_adaptor.py +319 -0
- nat/front_ends/mcp/__init__.py +14 -0
- nat/front_ends/mcp/mcp_front_end_config.py +36 -0
- nat/front_ends/mcp/mcp_front_end_plugin.py +81 -0
- nat/front_ends/mcp/mcp_front_end_plugin_worker.py +143 -0
- nat/front_ends/mcp/register.py +27 -0
- nat/front_ends/mcp/tool_converter.py +241 -0
- nat/front_ends/register.py +22 -0
- nat/front_ends/simple_base/__init__.py +14 -0
- nat/front_ends/simple_base/simple_front_end_plugin_base.py +54 -0
- nat/llm/__init__.py +0 -0
- nat/llm/aws_bedrock_llm.py +57 -0
- nat/llm/nim_llm.py +46 -0
- nat/llm/openai_llm.py +46 -0
- nat/llm/register.py +23 -0
- nat/llm/utils/__init__.py +14 -0
- nat/llm/utils/env_config_value.py +94 -0
- nat/llm/utils/error.py +17 -0
- nat/memory/__init__.py +20 -0
- nat/memory/interfaces.py +183 -0
- nat/memory/models.py +112 -0
- nat/meta/pypi.md +58 -0
- nat/object_store/__init__.py +20 -0
- nat/object_store/in_memory_object_store.py +76 -0
- nat/object_store/interfaces.py +84 -0
- nat/object_store/models.py +38 -0
- nat/object_store/register.py +20 -0
- nat/observability/__init__.py +14 -0
- nat/observability/exporter/__init__.py +14 -0
- nat/observability/exporter/base_exporter.py +449 -0
- nat/observability/exporter/exporter.py +78 -0
- nat/observability/exporter/file_exporter.py +33 -0
- nat/observability/exporter/processing_exporter.py +322 -0
- nat/observability/exporter/raw_exporter.py +52 -0
- nat/observability/exporter/span_exporter.py +288 -0
- nat/observability/exporter_manager.py +335 -0
- nat/observability/mixin/__init__.py +14 -0
- nat/observability/mixin/batch_config_mixin.py +26 -0
- nat/observability/mixin/collector_config_mixin.py +23 -0
- nat/observability/mixin/file_mixin.py +288 -0
- nat/observability/mixin/file_mode.py +23 -0
- nat/observability/mixin/resource_conflict_mixin.py +134 -0
- nat/observability/mixin/serialize_mixin.py +61 -0
- nat/observability/mixin/type_introspection_mixin.py +183 -0
- nat/observability/processor/__init__.py +14 -0
- nat/observability/processor/batching_processor.py +310 -0
- nat/observability/processor/callback_processor.py +42 -0
- nat/observability/processor/intermediate_step_serializer.py +28 -0
- nat/observability/processor/processor.py +71 -0
- nat/observability/register.py +96 -0
- nat/observability/utils/__init__.py +14 -0
- nat/observability/utils/dict_utils.py +236 -0
- nat/observability/utils/time_utils.py +31 -0
- nat/plugins/.namespace +1 -0
- nat/profiler/__init__.py +0 -0
- nat/profiler/calc/__init__.py +14 -0
- nat/profiler/calc/calc_runner.py +627 -0
- nat/profiler/calc/calculations.py +288 -0
- nat/profiler/calc/data_models.py +188 -0
- nat/profiler/calc/plot.py +345 -0
- nat/profiler/callbacks/__init__.py +0 -0
- nat/profiler/callbacks/agno_callback_handler.py +295 -0
- nat/profiler/callbacks/base_callback_class.py +20 -0
- nat/profiler/callbacks/langchain_callback_handler.py +290 -0
- nat/profiler/callbacks/llama_index_callback_handler.py +205 -0
- nat/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
- nat/profiler/callbacks/token_usage_base_model.py +27 -0
- nat/profiler/data_frame_row.py +51 -0
- nat/profiler/data_models.py +24 -0
- nat/profiler/decorators/__init__.py +0 -0
- nat/profiler/decorators/framework_wrapper.py +131 -0
- nat/profiler/decorators/function_tracking.py +254 -0
- nat/profiler/forecasting/__init__.py +0 -0
- nat/profiler/forecasting/config.py +18 -0
- nat/profiler/forecasting/model_trainer.py +75 -0
- nat/profiler/forecasting/models/__init__.py +22 -0
- nat/profiler/forecasting/models/forecasting_base_model.py +40 -0
- nat/profiler/forecasting/models/linear_model.py +197 -0
- nat/profiler/forecasting/models/random_forest_regressor.py +269 -0
- nat/profiler/inference_metrics_model.py +28 -0
- nat/profiler/inference_optimization/__init__.py +0 -0
- nat/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
- nat/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +460 -0
- nat/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
- nat/profiler/inference_optimization/data_models.py +386 -0
- nat/profiler/inference_optimization/experimental/__init__.py +0 -0
- nat/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
- nat/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
- nat/profiler/inference_optimization/llm_metrics.py +212 -0
- nat/profiler/inference_optimization/prompt_caching.py +163 -0
- nat/profiler/inference_optimization/token_uniqueness.py +107 -0
- nat/profiler/inference_optimization/workflow_runtimes.py +72 -0
- nat/profiler/intermediate_property_adapter.py +102 -0
- nat/profiler/profile_runner.py +473 -0
- nat/profiler/utils.py +184 -0
- nat/registry_handlers/__init__.py +0 -0
- nat/registry_handlers/local/__init__.py +0 -0
- nat/registry_handlers/local/local_handler.py +176 -0
- nat/registry_handlers/local/register_local.py +37 -0
- nat/registry_handlers/metadata_factory.py +60 -0
- nat/registry_handlers/package_utils.py +571 -0
- nat/registry_handlers/pypi/__init__.py +0 -0
- nat/registry_handlers/pypi/pypi_handler.py +251 -0
- nat/registry_handlers/pypi/register_pypi.py +40 -0
- nat/registry_handlers/register.py +21 -0
- nat/registry_handlers/registry_handler_base.py +157 -0
- nat/registry_handlers/rest/__init__.py +0 -0
- nat/registry_handlers/rest/register_rest.py +56 -0
- nat/registry_handlers/rest/rest_handler.py +237 -0
- nat/registry_handlers/schemas/__init__.py +0 -0
- nat/registry_handlers/schemas/headers.py +42 -0
- nat/registry_handlers/schemas/package.py +68 -0
- nat/registry_handlers/schemas/publish.py +68 -0
- nat/registry_handlers/schemas/pull.py +82 -0
- nat/registry_handlers/schemas/remove.py +36 -0
- nat/registry_handlers/schemas/search.py +91 -0
- nat/registry_handlers/schemas/status.py +47 -0
- nat/retriever/__init__.py +0 -0
- nat/retriever/interface.py +41 -0
- nat/retriever/milvus/__init__.py +14 -0
- nat/retriever/milvus/register.py +81 -0
- nat/retriever/milvus/retriever.py +228 -0
- nat/retriever/models.py +77 -0
- nat/retriever/nemo_retriever/__init__.py +14 -0
- nat/retriever/nemo_retriever/register.py +60 -0
- nat/retriever/nemo_retriever/retriever.py +190 -0
- nat/retriever/register.py +22 -0
- nat/runtime/__init__.py +14 -0
- nat/runtime/loader.py +220 -0
- nat/runtime/runner.py +195 -0
- nat/runtime/session.py +162 -0
- nat/runtime/user_metadata.py +130 -0
- nat/settings/__init__.py +0 -0
- nat/settings/global_settings.py +318 -0
- nat/test/.namespace +1 -0
- nat/tool/__init__.py +0 -0
- nat/tool/chat_completion.py +74 -0
- nat/tool/code_execution/README.md +151 -0
- nat/tool/code_execution/__init__.py +0 -0
- nat/tool/code_execution/code_sandbox.py +267 -0
- nat/tool/code_execution/local_sandbox/.gitignore +1 -0
- nat/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
- nat/tool/code_execution/local_sandbox/__init__.py +13 -0
- nat/tool/code_execution/local_sandbox/local_sandbox_server.py +198 -0
- nat/tool/code_execution/local_sandbox/sandbox.requirements.txt +6 -0
- nat/tool/code_execution/local_sandbox/start_local_sandbox.sh +50 -0
- nat/tool/code_execution/register.py +74 -0
- nat/tool/code_execution/test_code_execution_sandbox.py +414 -0
- nat/tool/code_execution/utils.py +100 -0
- nat/tool/datetime_tools.py +42 -0
- nat/tool/document_search.py +141 -0
- nat/tool/github_tools/__init__.py +0 -0
- nat/tool/github_tools/create_github_commit.py +133 -0
- nat/tool/github_tools/create_github_issue.py +87 -0
- nat/tool/github_tools/create_github_pr.py +106 -0
- nat/tool/github_tools/get_github_file.py +106 -0
- nat/tool/github_tools/get_github_issue.py +166 -0
- nat/tool/github_tools/get_github_pr.py +256 -0
- nat/tool/github_tools/update_github_issue.py +100 -0
- nat/tool/mcp/__init__.py +14 -0
- nat/tool/mcp/exceptions.py +142 -0
- nat/tool/mcp/mcp_client.py +255 -0
- nat/tool/mcp/mcp_tool.py +96 -0
- nat/tool/memory_tools/__init__.py +0 -0
- nat/tool/memory_tools/add_memory_tool.py +79 -0
- nat/tool/memory_tools/delete_memory_tool.py +67 -0
- nat/tool/memory_tools/get_memory_tool.py +72 -0
- nat/tool/nvidia_rag.py +95 -0
- nat/tool/register.py +38 -0
- nat/tool/retriever.py +94 -0
- nat/tool/server_tools.py +66 -0
- nat/utils/__init__.py +0 -0
- nat/utils/data_models/__init__.py +0 -0
- nat/utils/data_models/schema_validator.py +58 -0
- nat/utils/debugging_utils.py +43 -0
- nat/utils/dump_distro_mapping.py +32 -0
- nat/utils/exception_handlers/__init__.py +0 -0
- nat/utils/exception_handlers/automatic_retries.py +289 -0
- nat/utils/exception_handlers/mcp.py +211 -0
- nat/utils/exception_handlers/schemas.py +114 -0
- nat/utils/io/__init__.py +0 -0
- nat/utils/io/model_processing.py +28 -0
- nat/utils/io/yaml_tools.py +119 -0
- nat/utils/log_utils.py +37 -0
- nat/utils/metadata_utils.py +74 -0
- nat/utils/optional_imports.py +142 -0
- nat/utils/producer_consumer_queue.py +178 -0
- nat/utils/reactive/__init__.py +0 -0
- nat/utils/reactive/base/__init__.py +0 -0
- nat/utils/reactive/base/observable_base.py +65 -0
- nat/utils/reactive/base/observer_base.py +55 -0
- nat/utils/reactive/base/subject_base.py +79 -0
- nat/utils/reactive/observable.py +59 -0
- nat/utils/reactive/observer.py +76 -0
- nat/utils/reactive/subject.py +131 -0
- nat/utils/reactive/subscription.py +49 -0
- nat/utils/settings/__init__.py +0 -0
- nat/utils/settings/global_settings.py +197 -0
- nat/utils/string_utils.py +38 -0
- nat/utils/type_converter.py +290 -0
- nat/utils/type_utils.py +484 -0
- nat/utils/url_utils.py +27 -0
- nvidia_nat-1.2.0.dist-info/METADATA +365 -0
- nvidia_nat-1.2.0.dist-info/RECORD +435 -0
- nvidia_nat-1.2.0.dist-info/WHEEL +5 -0
- nvidia_nat-1.2.0.dist-info/entry_points.txt +21 -0
- nvidia_nat-1.2.0.dist-info/licenses/LICENSE-3rd-party.txt +5478 -0
- nvidia_nat-1.2.0.dist-info/licenses/LICENSE.md +201 -0
- nvidia_nat-1.2.0.dist-info/top_level.txt +2 -0
|
@@ -0,0 +1,43 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from enum import Enum
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
class PipelineTypeEnum(str, Enum):
    """
    Kinds of pipeline used in Inference Time Scaling.

    Members are also ``str`` instances, so each one compares equal to its
    plain string value (for example ``"planning"``).
    """
    PLANNING = "planning"
    TOOL_USE = "tool_use"
    AGENT_EXECUTION = "agent_execution"
    CUSTOM = "custom"

    def __str__(self) -> str:
        # Render as the raw value instead of the default ``ClassName.MEMBER`` form.
        return self._value_
|
|
30
|
+
|
|
31
|
+
|
|
32
|
+
class StageTypeEnum(str, Enum):
    """
    Kinds of stage that can appear inside a pipeline.

    Members are also ``str`` instances, so each one compares equal to its
    plain string value (for example ``"search"``).
    """
    SEARCH = "search"
    EDITING = "editing"
    SCORING = "scoring"
    SELECTION = "selection"
    CUSTOM = "custom"

    def __str__(self) -> str:
        # Render as the raw value instead of the default ``ClassName.MEMBER`` form.
        return self._value_
|
|
@@ -0,0 +1,66 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from abc import ABC
|
|
17
|
+
from abc import abstractmethod
|
|
18
|
+
|
|
19
|
+
from nat.builder.builder import Builder
|
|
20
|
+
from nat.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
21
|
+
from nat.experimental.test_time_compute.models.stage_enums import StageTypeEnum, PipelineTypeEnum
|
|
22
|
+
from nat.data_models.ttc_strategy import TTCStrategyBaseConfig
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
class StrategyBase(ABC):
    """
    Abstract base class for strategy implementations.

    This class defines the interface for strategies that can be used in the
    TTC framework. Concrete strategy classes should implement the abstract
    methods defined here.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        """
        Store the strategy configuration.

        Args:
            config: Configuration object for this strategy.
        """
        self.config: TTCStrategyBaseConfig = config
        # Stays ``None`` until ``set_pipeline_type`` accepts a supported value.
        self.pipeline_type: PipelineTypeEnum | None = None

    @abstractmethod
    async def build_components(self, builder: Builder) -> None:
        """
        Build the components required for the strategy.

        Args:
            builder: Builder handed to the strategy for constructing its components.
        """
        pass

    @abstractmethod
    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Run the strategy on the given items.

        Args:
            items: The items the strategy operates on.
            original_prompt: Optional prompt text; how it is used is up to the implementation.
            agent_context: Optional context text; how it is used is up to the implementation.
            **kwargs: Additional implementation-specific keyword arguments.

        Returns:
            A list of ``TTCItem`` objects produced by the strategy.
        """
        pass

    @abstractmethod
    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types supported by this strategy."""
        pass

    @abstractmethod
    def stage_type(self) -> StageTypeEnum:
        """Return the stage type of this strategy."""
        pass

    def set_pipeline_type(self, pipeline_type: PipelineTypeEnum) -> None:
        """
        Set the pipeline type for this strategy.

        Args:
            pipeline_type: The pipeline type to assign.

        Raises:
            ValueError: If ``pipeline_type`` is not among ``supported_pipeline_types()``.
        """
        # Reject unsupported types first so ``self.pipeline_type`` is never left in an invalid state.
        if pipeline_type not in self.supported_pipeline_types():
            raise ValueError(f"Pipeline type {pipeline_type} is not supported by this strategy.")
        self.pipeline_type = pipeline_type
|
|
@@ -0,0 +1,41 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from pydantic import BaseModel
|
|
17
|
+
from pydantic import Field
|
|
18
|
+
|
|
19
|
+
|
|
20
|
+
class ToolUseInputSchema(BaseModel):
    """
    Describes a single tool-use request passed to the tool use function.
    """
    # Required: which tool to call and what it is being asked to do.
    tool_name: str = Field(
        description="The name of the tool to use. Must be registered in the system.",
    )
    task_description: str = Field(
        description="The description of the task to perform with the tool.",
    )

    # Optional: both default to None when not supplied.
    motivation: str | None = Field(
        description="An optional motivation for the tool use, providing additional context or reasoning.",
        default=None,
    )
    output: str | None = Field(
        description="The output of the tool use. This can be used to store the result of the tool execution.",
        default=None,
    )
|
|
34
|
+
|
|
35
|
+
|
|
36
|
+
class ToolUselist(BaseModel):
    """
    Container model holding a list of tool-use inputs.
    """
    # Required field: no default is declared.
    tools: list[ToolUseInputSchema] = Field(
        description="A list of tool use inputs, each containing the tool name and task description.",
    )
|
|
@@ -0,0 +1,48 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import typing
|
|
17
|
+
|
|
18
|
+
from pydantic import BaseModel
|
|
19
|
+
from pydantic import ConfigDict
|
|
20
|
+
from pydantic import Field
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
class TTCItem(BaseModel):
    """
    A single item passed through the TTC functions and pipelines.

    Every declared field is optional and defaults to ``None``.
    """
    # extra="allow": attributes beyond the declared fields are accepted.
    model_config = ConfigDict(extra="allow")

    input: typing.Any | None = Field(
        default=None,
        description="Input to the function or pipeline. This can be a structured tool call, or other info.",
    )
    output: typing.Any | None = Field(
        default=None,
        description="Output from the function or pipeline. This can be a structured tool call, or other info.",
    )
    plan: typing.Any | None = Field(
        default=None,
        description="Search plan for downstream agent(s).",
    )
    feedback: str | None = Field(
        default=None,
        description="Feedback provided by feedback steps to improve the plan.",
    )
    score: float | None = Field(
        default=None,
        description=("Score of the plan based on feedback or other evaluation criteria. "
                     "This can be used to rank plans."),
    )
    metadata: typing.Any | None = Field(
        default=None,
        description="Additional information. This can be a structured tool call, or other info not in the plan.",
    )
    name: str | None = Field(
        default=None,
        description="Name of the item or function, used for identification in pipelines.",
    )
|
|
@@ -0,0 +1,36 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
# pylint: disable=unused-import
|
|
17
|
+
# flake8: noqa
|
|
18
|
+
|
|
19
|
+
from .editing import iterative_plan_refinement_editor
|
|
20
|
+
from .editing import llm_as_a_judge_editor
|
|
21
|
+
from .editing import motivation_aware_summarization
|
|
22
|
+
from .functions import execute_score_select_function
|
|
23
|
+
from .functions import plan_select_execute_function
|
|
24
|
+
from .functions import ttc_tool_orchestration_function
|
|
25
|
+
from .functions import ttc_tool_wrapper_function
|
|
26
|
+
from .scoring import llm_based_agent_scorer
|
|
27
|
+
from .scoring import llm_based_plan_scorer
|
|
28
|
+
from .scoring import motivation_aware_scorer
|
|
29
|
+
from .search import multi_llm_planner
|
|
30
|
+
from .search import multi_query_retrieval_search
|
|
31
|
+
from .search import single_shot_multi_plan_planner
|
|
32
|
+
from .selection import best_of_n_selector
|
|
33
|
+
from .selection import llm_based_agent_output_selector
|
|
34
|
+
from .selection import llm_based_output_merging_selector
|
|
35
|
+
from .selection import llm_based_plan_selector
|
|
36
|
+
from .selection import threshold_selector
|
|
File without changes
|
|
@@ -0,0 +1,168 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import asyncio
|
|
17
|
+
import logging
|
|
18
|
+
import re
|
|
19
|
+
|
|
20
|
+
from nat.builder.builder import Builder
|
|
21
|
+
from nat.builder.framework_enum import LLMFrameworkEnum
|
|
22
|
+
from nat.cli.register_workflow import register_ttc_strategy
|
|
23
|
+
from nat.data_models.ttc_strategy import TTCStrategyBaseConfig
|
|
24
|
+
from nat.experimental.test_time_compute.models.scoring_config import LLMBasedAgentScoringConfig
|
|
25
|
+
from nat.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
26
|
+
from nat.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
27
|
+
from nat.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
28
|
+
from nat.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
29
|
+
from nat.utils.io.model_processing import remove_r1_think_tags
|
|
30
|
+
|
|
31
|
+
logger = logging.getLogger(__name__)
|
|
32
|
+
|
|
33
|
+
|
|
34
|
+
class LLMBasedAgentScorer(StrategyBase):
    """
    Scoring strategy that asks an LLM to rate the output produced for each item.

    The LLM named by ``config.scoring_llm`` is prompted with ``config.scoring_template`` and is expected to
    include ``FINAL SCORE: <float>`` in its reply. The parsed number is written to each item's ``score``.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        super().__init__(config)
        # Populated by `build_components`; `score_single` refuses to run until it is a chat model.
        self.llm_bound = None

    async def build_components(self, builder: Builder) -> None:
        """
        Fetch the scoring LLM from the builder, wrapped for LangChain.

        Args:
            builder (Builder): The builder used to resolve ``config.scoring_llm``.
        """
        self.llm_bound = await builder.get_llm(self.config.scoring_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types this strategy supports (agent execution only)."""
        return [PipelineTypeEnum.AGENT_EXECUTION]

    def stage_type(self) -> StageTypeEnum:
        """Return the stage this strategy implements (scoring)."""
        return StageTypeEnum.SCORING

    async def score_single(self, original_prompt: str | None, agent_context: str | None, item: TTCItem) -> float:
        """
        Score a single item using the LLM.

        Args:
            original_prompt (str | None): The original prompt. When empty or None, ``str(item.input)`` is
                used as the template's ``input`` value instead.
            agent_context (str | None): The agent context, passed to the template as ``objective``.
            item (TTCItem): The item to score; ``str(item.output)`` is passed as ``output``.

        Returns:
            float: The number following ``FINAL SCORE:`` in the LLM reply, or ``0.0`` when the reply
                contains no such number.

        Raises:
            ImportError: If ``langchain-core`` is not installed.
            ValueError: If the scoring LLM is not a ``BaseChatModel`` or its reply content is not a string.
        """

        try:
            from langchain_core.language_models import BaseChatModel
            from langchain_core.prompts import PromptTemplate
        except ImportError as exc:
            raise ImportError("langchain-core is not installed. Please install it to use LLMBasedAgentScorer.\n"
                              "This error can be resolved by installing nvidia-nat-langchain.") from exc

        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("The `scoring_llm` must be an instance of `BaseChatModel`.")

        model: BaseChatModel = self.llm_bound

        prompt_template = PromptTemplate(
            template=self.config.scoring_template,
            input_variables=["objective", "input", "output"],
            validate_template=True,
        )

        prompt = await prompt_template.ainvoke(
            input={
                "objective": agent_context,
                "input": original_prompt if original_prompt else str(item.input),
                "output": str(item.output),
            })

        response = (await model.ainvoke(prompt)).content

        # Validate the type before any text processing, so non-text content (e.g. a list of content
        # parts) is reported through the ValueError below rather than failing inside a string helper.
        if not isinstance(response, str):
            logger.warning("Invalid response from LLM for scoring: %s.", response)
            raise ValueError("Unable to parse the score from the LLM response.")

        # NOTE(review): presumably strips reasoning-model `<think>` sections - confirm against the helper.
        response = remove_r1_think_tags(response).strip()

        # The score follows the format `FINAL SCORE: <float>` in the response from the LLM.
        # Only a well-formed decimal is captured, so sentence punctuation after the number
        # ("FINAL SCORE: 8.5.") cannot make the float conversion fail and abort the whole batch.
        match = re.search(r'FINAL SCORE:\s*(\d+(?:\.\d+)?|\.\d+)', response)
        if not match:
            logger.warning("Could not parse the score from the response: %s.", response)
            return 0.0

        return float(match.group(1))

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Score a list of items concurrently and record each score on its item.

        Args:
            items (list[TTCItem]): The items to score.
            original_prompt (str | None): The original prompt.
            agent_context (str | None): The agent context.

        Returns:
            list[TTCItem]: The same ``items`` list, with ``score`` set on every element. An empty list is
                returned when ``items`` is empty.
        """
        if not items:
            return []

        # `asyncio.gather` returns one result per awaitable, in the order the awaitables were passed.
        scores = await asyncio.gather(*(self.score_single(
            original_prompt=original_prompt, agent_context=agent_context, item=item) for item in items))

        logger.debug("Scores for planning items: %s", scores)

        # `strict=True` keeps the original guarantee that a count mismatch raises ValueError.
        for item, score in zip(items, scores, strict=True):
            item.score = score

        return items
|
|
152
|
+
|
|
153
|
+
|
|
154
|
+
@register_ttc_strategy(config_type=LLMBasedAgentScoringConfig)
async def register_llm_based_agent_scorer(config: LLMBasedAgentScoringConfig, builder: Builder):
    """
    Construct an LLM-based agent scorer, build its components, and yield it.

    Args:
        config (LLMBasedAgentScoringConfig): The configuration for the LLM-based agent scorer.
        builder (Builder): The builder instance passed to the scorer's ``build_components``.

    Yields:
        LLMBasedAgentScorer: The scorer, after ``build_components`` has completed.
    """
    agent_scorer = LLMBasedAgentScorer(config)
    # Components are built before the scorer is handed out.
    await agent_scorer.build_components(builder)
    yield agent_scorer
|
|
@@ -0,0 +1,168 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import asyncio
|
|
17
|
+
import logging
|
|
18
|
+
import re
|
|
19
|
+
|
|
20
|
+
from nat.builder.builder import Builder
|
|
21
|
+
from nat.builder.framework_enum import LLMFrameworkEnum
|
|
22
|
+
from nat.cli.register_workflow import register_ttc_strategy
|
|
23
|
+
from nat.data_models.ttc_strategy import TTCStrategyBaseConfig
|
|
24
|
+
from nat.experimental.test_time_compute.models.scoring_config import LLMBasedPlanScoringConfig
|
|
25
|
+
from nat.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
26
|
+
from nat.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
27
|
+
from nat.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
28
|
+
from nat.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
29
|
+
from nat.utils.io.model_processing import remove_r1_think_tags
|
|
30
|
+
|
|
31
|
+
logger = logging.getLogger(__name__)
|
|
32
|
+
|
|
33
|
+
|
|
34
|
+
class LLMBasedPlanScorer(StrategyBase):
    """
    Scoring strategy that asks an LLM to rate each candidate plan.

    The LLM named by ``config.scoring_llm`` is prompted with ``config.scoring_template`` and is expected to
    include ``FINAL SCORE: <float>`` in its reply. The parsed number is written to each item's ``score``.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        super().__init__(config)
        # Populated by `build_components`; `score_single` refuses to run until it is a chat model.
        self.llm_bound = None

    async def build_components(self, builder: Builder) -> None:
        """
        Fetch the scoring LLM from the builder, wrapped for LangChain.

        Args:
            builder (Builder): The builder used to resolve ``config.scoring_llm``.
        """
        self.llm_bound = await builder.get_llm(self.config.scoring_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types this strategy supports (planning only)."""
        return [PipelineTypeEnum.PLANNING]

    def stage_type(self) -> StageTypeEnum:
        """Return the stage this strategy implements (scoring)."""
        return StageTypeEnum.SCORING

    async def score_single(self, original_prompt: str | None, agent_context: str | None,
                           planning_item: TTCItem) -> float:
        """
        Score a single planning item using the LLM.

        Args:
            original_prompt (str | None): The original prompt, passed to the template as ``original_prompt``.
            agent_context (str | None): The agent context, passed to the template as ``context``.
            planning_item (TTCItem): The item to score; its ``plan`` is passed to the template as ``plan``
                after ``remove_r1_think_tags`` has been applied.

        Returns:
            float: The number following ``FINAL SCORE:`` in the LLM reply, or ``0.0`` when the reply
                contains no such number.

        Raises:
            ImportError: If ``langchain-core`` is not installed.
            ValueError: If the scoring LLM is not a ``BaseChatModel`` or its reply content is not a string.
        """

        try:
            from langchain_core.language_models import BaseChatModel
            from langchain_core.prompts import PromptTemplate
        except ImportError as exc:
            raise ImportError("langchain-core is not installed. Please install it to use LLMBasedPlanScorer.\n"
                              "This error can be resolved by installing nvidia-nat-langchain.") from exc

        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("The `scoring_llm` must be an instance of `BaseChatModel`.")

        model: BaseChatModel = self.llm_bound

        prompt_template = PromptTemplate(
            template=self.config.scoring_template,
            input_variables=["original_prompt", "context", "plan"],
            validate_template=True,
        )

        prompt = await prompt_template.ainvoke(
            input={
                "original_prompt": original_prompt,
                "context": agent_context,
                "plan": remove_r1_think_tags(planning_item.plan),
            })

        response = (await model.ainvoke(prompt)).content

        if not isinstance(response, str):
            logger.warning("Invalid response from LLM for scoring: %s.", response)
            raise ValueError("Unable to parse the score from the LLM response.")

        # Apply the same clean-up to the reply that is applied to the plan, so a tentative
        # "FINAL SCORE:" written while the model is still reasoning is not taken as the verdict.
        # NOTE(review): presumably strips reasoning-model `<think>` sections - confirm against the helper.
        response = remove_r1_think_tags(response).strip()

        # The score follows the format `FINAL SCORE: <float>` in the response from the LLM.
        # Only a well-formed decimal is captured, so sentence punctuation after the number
        # ("FINAL SCORE: 8.5.") cannot make the float conversion fail and abort the whole batch.
        match = re.search(r'FINAL SCORE:\s*(\d+(?:\.\d+)?|\.\d+)', response)
        if not match:
            logger.warning("Could not parse the score from the response: %s.", response)
            return 0.0

        return float(match.group(1))

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Score a list of planning items concurrently and record each score on its item.

        Args:
            items (list[TTCItem]): The list of planning items to score.
            original_prompt (str | None): The original prompt.
            agent_context (str | None): The agent context.

        Returns:
            list[TTCItem]: The same ``items`` list, with ``score`` set on every element. An empty list is
                returned when ``items`` is empty.
        """
        if not items:
            return []

        # `asyncio.gather` returns one result per awaitable, in the order the awaitables were passed.
        scores = await asyncio.gather(*(self.score_single(
            original_prompt=original_prompt, agent_context=agent_context, planning_item=item) for item in items))

        logger.debug("Scores for planning items: %s", scores)

        # `strict=True` keeps the original guarantee that a count mismatch raises ValueError.
        for item, score in zip(items, scores, strict=True):
            item.score = score

        return items
|
|
152
|
+
|
|
153
|
+
|
|
154
|
+
@register_ttc_strategy(config_type=LLMBasedPlanScoringConfig)
async def register_llm_based_plan_scorer(config: LLMBasedPlanScoringConfig, builder: Builder):
    """
    Construct an LLM-based plan scorer, build its components, and yield it.

    Args:
        config (LLMBasedPlanScoringConfig): The configuration for the strategy.
        builder (Builder): The builder instance passed to the scorer's ``build_components``.

    Yields:
        LLMBasedPlanScorer: The scorer, after ``build_components`` has completed.
    """
    plan_scorer = LLMBasedPlanScorer(config)
    # Components are built before the scorer is handed out.
    await plan_scorer.build_components(builder)
    yield plan_scorer
|