nvidia-nat 1.1.0a20251020__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- aiq/__init__.py +66 -0
- nat/agent/__init__.py +0 -0
- nat/agent/base.py +265 -0
- nat/agent/dual_node.py +72 -0
- nat/agent/prompt_optimizer/__init__.py +0 -0
- nat/agent/prompt_optimizer/prompt.py +68 -0
- nat/agent/prompt_optimizer/register.py +149 -0
- nat/agent/react_agent/__init__.py +0 -0
- nat/agent/react_agent/agent.py +394 -0
- nat/agent/react_agent/output_parser.py +104 -0
- nat/agent/react_agent/prompt.py +44 -0
- nat/agent/react_agent/register.py +168 -0
- nat/agent/reasoning_agent/__init__.py +0 -0
- nat/agent/reasoning_agent/reasoning_agent.py +227 -0
- nat/agent/register.py +23 -0
- nat/agent/rewoo_agent/__init__.py +0 -0
- nat/agent/rewoo_agent/agent.py +593 -0
- nat/agent/rewoo_agent/prompt.py +107 -0
- nat/agent/rewoo_agent/register.py +175 -0
- nat/agent/tool_calling_agent/__init__.py +0 -0
- nat/agent/tool_calling_agent/agent.py +246 -0
- nat/agent/tool_calling_agent/register.py +129 -0
- nat/authentication/__init__.py +14 -0
- nat/authentication/api_key/__init__.py +14 -0
- nat/authentication/api_key/api_key_auth_provider.py +96 -0
- nat/authentication/api_key/api_key_auth_provider_config.py +124 -0
- nat/authentication/api_key/register.py +26 -0
- nat/authentication/credential_validator/__init__.py +14 -0
- nat/authentication/credential_validator/bearer_token_validator.py +557 -0
- nat/authentication/exceptions/__init__.py +14 -0
- nat/authentication/exceptions/api_key_exceptions.py +38 -0
- nat/authentication/http_basic_auth/__init__.py +0 -0
- nat/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
- nat/authentication/http_basic_auth/register.py +30 -0
- nat/authentication/interfaces.py +96 -0
- nat/authentication/oauth2/__init__.py +14 -0
- nat/authentication/oauth2/oauth2_auth_code_flow_provider.py +140 -0
- nat/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
- nat/authentication/oauth2/oauth2_resource_server_config.py +124 -0
- nat/authentication/oauth2/register.py +25 -0
- nat/authentication/register.py +20 -0
- nat/builder/__init__.py +0 -0
- nat/builder/builder.py +317 -0
- nat/builder/component_utils.py +320 -0
- nat/builder/context.py +321 -0
- nat/builder/embedder.py +24 -0
- nat/builder/eval_builder.py +166 -0
- nat/builder/evaluator.py +29 -0
- nat/builder/framework_enum.py +25 -0
- nat/builder/front_end.py +73 -0
- nat/builder/function.py +714 -0
- nat/builder/function_base.py +380 -0
- nat/builder/function_info.py +625 -0
- nat/builder/intermediate_step_manager.py +206 -0
- nat/builder/llm.py +25 -0
- nat/builder/retriever.py +25 -0
- nat/builder/user_interaction_manager.py +78 -0
- nat/builder/workflow.py +160 -0
- nat/builder/workflow_builder.py +1365 -0
- nat/cli/__init__.py +14 -0
- nat/cli/cli_utils/__init__.py +0 -0
- nat/cli/cli_utils/config_override.py +231 -0
- nat/cli/cli_utils/validation.py +37 -0
- nat/cli/commands/__init__.py +0 -0
- nat/cli/commands/configure/__init__.py +0 -0
- nat/cli/commands/configure/channel/__init__.py +0 -0
- nat/cli/commands/configure/channel/add.py +28 -0
- nat/cli/commands/configure/channel/channel.py +34 -0
- nat/cli/commands/configure/channel/remove.py +30 -0
- nat/cli/commands/configure/channel/update.py +30 -0
- nat/cli/commands/configure/configure.py +33 -0
- nat/cli/commands/evaluate.py +139 -0
- nat/cli/commands/info/__init__.py +14 -0
- nat/cli/commands/info/info.py +47 -0
- nat/cli/commands/info/list_channels.py +32 -0
- nat/cli/commands/info/list_components.py +128 -0
- nat/cli/commands/mcp/__init__.py +14 -0
- nat/cli/commands/mcp/mcp.py +986 -0
- nat/cli/commands/object_store/__init__.py +14 -0
- nat/cli/commands/object_store/object_store.py +227 -0
- nat/cli/commands/optimize.py +90 -0
- nat/cli/commands/registry/__init__.py +14 -0
- nat/cli/commands/registry/publish.py +88 -0
- nat/cli/commands/registry/pull.py +118 -0
- nat/cli/commands/registry/registry.py +36 -0
- nat/cli/commands/registry/remove.py +108 -0
- nat/cli/commands/registry/search.py +153 -0
- nat/cli/commands/sizing/__init__.py +14 -0
- nat/cli/commands/sizing/calc.py +297 -0
- nat/cli/commands/sizing/sizing.py +27 -0
- nat/cli/commands/start.py +257 -0
- nat/cli/commands/uninstall.py +81 -0
- nat/cli/commands/validate.py +47 -0
- nat/cli/commands/workflow/__init__.py +14 -0
- nat/cli/commands/workflow/templates/__init__.py.j2 +0 -0
- nat/cli/commands/workflow/templates/config.yml.j2 +17 -0
- nat/cli/commands/workflow/templates/pyproject.toml.j2 +25 -0
- nat/cli/commands/workflow/templates/register.py.j2 +4 -0
- nat/cli/commands/workflow/templates/workflow.py.j2 +50 -0
- nat/cli/commands/workflow/workflow.py +37 -0
- nat/cli/commands/workflow/workflow_commands.py +403 -0
- nat/cli/entrypoint.py +141 -0
- nat/cli/main.py +60 -0
- nat/cli/register_workflow.py +522 -0
- nat/cli/type_registry.py +1069 -0
- nat/control_flow/__init__.py +0 -0
- nat/control_flow/register.py +20 -0
- nat/control_flow/router_agent/__init__.py +0 -0
- nat/control_flow/router_agent/agent.py +329 -0
- nat/control_flow/router_agent/prompt.py +48 -0
- nat/control_flow/router_agent/register.py +91 -0
- nat/control_flow/sequential_executor.py +166 -0
- nat/data_models/__init__.py +14 -0
- nat/data_models/agent.py +34 -0
- nat/data_models/api_server.py +843 -0
- nat/data_models/authentication.py +245 -0
- nat/data_models/common.py +171 -0
- nat/data_models/component.py +60 -0
- nat/data_models/component_ref.py +179 -0
- nat/data_models/config.py +434 -0
- nat/data_models/dataset_handler.py +169 -0
- nat/data_models/discovery_metadata.py +305 -0
- nat/data_models/embedder.py +27 -0
- nat/data_models/evaluate.py +130 -0
- nat/data_models/evaluator.py +26 -0
- nat/data_models/front_end.py +26 -0
- nat/data_models/function.py +64 -0
- nat/data_models/function_dependencies.py +80 -0
- nat/data_models/gated_field_mixin.py +242 -0
- nat/data_models/interactive.py +246 -0
- nat/data_models/intermediate_step.py +302 -0
- nat/data_models/invocation_node.py +38 -0
- nat/data_models/llm.py +27 -0
- nat/data_models/logging.py +26 -0
- nat/data_models/memory.py +27 -0
- nat/data_models/object_store.py +44 -0
- nat/data_models/optimizable.py +119 -0
- nat/data_models/optimizer.py +149 -0
- nat/data_models/profiler.py +54 -0
- nat/data_models/registry_handler.py +26 -0
- nat/data_models/retriever.py +30 -0
- nat/data_models/retry_mixin.py +35 -0
- nat/data_models/span.py +228 -0
- nat/data_models/step_adaptor.py +64 -0
- nat/data_models/streaming.py +33 -0
- nat/data_models/swe_bench_model.py +54 -0
- nat/data_models/telemetry_exporter.py +26 -0
- nat/data_models/temperature_mixin.py +44 -0
- nat/data_models/thinking_mixin.py +86 -0
- nat/data_models/top_p_mixin.py +44 -0
- nat/data_models/ttc_strategy.py +30 -0
- nat/embedder/__init__.py +0 -0
- nat/embedder/azure_openai_embedder.py +46 -0
- nat/embedder/nim_embedder.py +59 -0
- nat/embedder/openai_embedder.py +42 -0
- nat/embedder/register.py +22 -0
- nat/eval/__init__.py +14 -0
- nat/eval/config.py +62 -0
- nat/eval/dataset_handler/__init__.py +0 -0
- nat/eval/dataset_handler/dataset_downloader.py +106 -0
- nat/eval/dataset_handler/dataset_filter.py +52 -0
- nat/eval/dataset_handler/dataset_handler.py +431 -0
- nat/eval/evaluate.py +565 -0
- nat/eval/evaluator/__init__.py +14 -0
- nat/eval/evaluator/base_evaluator.py +77 -0
- nat/eval/evaluator/evaluator_model.py +58 -0
- nat/eval/intermediate_step_adapter.py +99 -0
- nat/eval/rag_evaluator/__init__.py +0 -0
- nat/eval/rag_evaluator/evaluate.py +178 -0
- nat/eval/rag_evaluator/register.py +143 -0
- nat/eval/register.py +26 -0
- nat/eval/remote_workflow.py +133 -0
- nat/eval/runners/__init__.py +14 -0
- nat/eval/runners/config.py +39 -0
- nat/eval/runners/multi_eval_runner.py +54 -0
- nat/eval/runtime_evaluator/__init__.py +14 -0
- nat/eval/runtime_evaluator/evaluate.py +123 -0
- nat/eval/runtime_evaluator/register.py +100 -0
- nat/eval/runtime_event_subscriber.py +52 -0
- nat/eval/swe_bench_evaluator/__init__.py +0 -0
- nat/eval/swe_bench_evaluator/evaluate.py +215 -0
- nat/eval/swe_bench_evaluator/register.py +36 -0
- nat/eval/trajectory_evaluator/__init__.py +0 -0
- nat/eval/trajectory_evaluator/evaluate.py +75 -0
- nat/eval/trajectory_evaluator/register.py +40 -0
- nat/eval/tunable_rag_evaluator/__init__.py +0 -0
- nat/eval/tunable_rag_evaluator/evaluate.py +242 -0
- nat/eval/tunable_rag_evaluator/register.py +52 -0
- nat/eval/usage_stats.py +41 -0
- nat/eval/utils/__init__.py +0 -0
- nat/eval/utils/eval_trace_ctx.py +89 -0
- nat/eval/utils/output_uploader.py +140 -0
- nat/eval/utils/tqdm_position_registry.py +40 -0
- nat/eval/utils/weave_eval.py +193 -0
- nat/experimental/__init__.py +0 -0
- nat/experimental/decorators/__init__.py +0 -0
- nat/experimental/decorators/experimental_warning_decorator.py +154 -0
- nat/experimental/test_time_compute/__init__.py +0 -0
- nat/experimental/test_time_compute/editing/__init__.py +0 -0
- nat/experimental/test_time_compute/editing/iterative_plan_refinement_editor.py +147 -0
- nat/experimental/test_time_compute/editing/llm_as_a_judge_editor.py +204 -0
- nat/experimental/test_time_compute/editing/motivation_aware_summarization.py +107 -0
- nat/experimental/test_time_compute/functions/__init__.py +0 -0
- nat/experimental/test_time_compute/functions/execute_score_select_function.py +105 -0
- nat/experimental/test_time_compute/functions/plan_select_execute_function.py +228 -0
- nat/experimental/test_time_compute/functions/ttc_tool_orchestration_function.py +205 -0
- nat/experimental/test_time_compute/functions/ttc_tool_wrapper_function.py +146 -0
- nat/experimental/test_time_compute/models/__init__.py +0 -0
- nat/experimental/test_time_compute/models/editor_config.py +132 -0
- nat/experimental/test_time_compute/models/scoring_config.py +112 -0
- nat/experimental/test_time_compute/models/search_config.py +120 -0
- nat/experimental/test_time_compute/models/selection_config.py +154 -0
- nat/experimental/test_time_compute/models/stage_enums.py +43 -0
- nat/experimental/test_time_compute/models/strategy_base.py +67 -0
- nat/experimental/test_time_compute/models/tool_use_config.py +41 -0
- nat/experimental/test_time_compute/models/ttc_item.py +48 -0
- nat/experimental/test_time_compute/register.py +35 -0
- nat/experimental/test_time_compute/scoring/__init__.py +0 -0
- nat/experimental/test_time_compute/scoring/llm_based_agent_scorer.py +168 -0
- nat/experimental/test_time_compute/scoring/llm_based_plan_scorer.py +168 -0
- nat/experimental/test_time_compute/scoring/motivation_aware_scorer.py +111 -0
- nat/experimental/test_time_compute/search/__init__.py +0 -0
- nat/experimental/test_time_compute/search/multi_llm_planner.py +128 -0
- nat/experimental/test_time_compute/search/multi_query_retrieval_search.py +122 -0
- nat/experimental/test_time_compute/search/single_shot_multi_plan_planner.py +128 -0
- nat/experimental/test_time_compute/selection/__init__.py +0 -0
- nat/experimental/test_time_compute/selection/best_of_n_selector.py +63 -0
- nat/experimental/test_time_compute/selection/llm_based_agent_output_selector.py +131 -0
- nat/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +157 -0
- nat/experimental/test_time_compute/selection/llm_based_plan_selector.py +128 -0
- nat/experimental/test_time_compute/selection/threshold_selector.py +58 -0
- nat/front_ends/__init__.py +14 -0
- nat/front_ends/console/__init__.py +14 -0
- nat/front_ends/console/authentication_flow_handler.py +285 -0
- nat/front_ends/console/console_front_end_config.py +32 -0
- nat/front_ends/console/console_front_end_plugin.py +108 -0
- nat/front_ends/console/register.py +25 -0
- nat/front_ends/cron/__init__.py +14 -0
- nat/front_ends/fastapi/__init__.py +14 -0
- nat/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
- nat/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
- nat/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +142 -0
- nat/front_ends/fastapi/dask_client_mixin.py +65 -0
- nat/front_ends/fastapi/fastapi_front_end_config.py +272 -0
- nat/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
- nat/front_ends/fastapi/fastapi_front_end_plugin.py +247 -0
- nat/front_ends/fastapi/fastapi_front_end_plugin_worker.py +1257 -0
- nat/front_ends/fastapi/html_snippets/__init__.py +14 -0
- nat/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
- nat/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
- nat/front_ends/fastapi/job_store.py +602 -0
- nat/front_ends/fastapi/main.py +64 -0
- nat/front_ends/fastapi/message_handler.py +344 -0
- nat/front_ends/fastapi/message_validator.py +351 -0
- nat/front_ends/fastapi/register.py +25 -0
- nat/front_ends/fastapi/response_helpers.py +195 -0
- nat/front_ends/fastapi/step_adaptor.py +319 -0
- nat/front_ends/fastapi/utils.py +57 -0
- nat/front_ends/mcp/__init__.py +14 -0
- nat/front_ends/mcp/introspection_token_verifier.py +73 -0
- nat/front_ends/mcp/mcp_front_end_config.py +90 -0
- nat/front_ends/mcp/mcp_front_end_plugin.py +113 -0
- nat/front_ends/mcp/mcp_front_end_plugin_worker.py +268 -0
- nat/front_ends/mcp/memory_profiler.py +320 -0
- nat/front_ends/mcp/register.py +27 -0
- nat/front_ends/mcp/tool_converter.py +290 -0
- nat/front_ends/register.py +21 -0
- nat/front_ends/simple_base/__init__.py +14 -0
- nat/front_ends/simple_base/simple_front_end_plugin_base.py +56 -0
- nat/llm/__init__.py +0 -0
- nat/llm/aws_bedrock_llm.py +69 -0
- nat/llm/azure_openai_llm.py +57 -0
- nat/llm/litellm_llm.py +69 -0
- nat/llm/nim_llm.py +58 -0
- nat/llm/openai_llm.py +54 -0
- nat/llm/register.py +27 -0
- nat/llm/utils/__init__.py +14 -0
- nat/llm/utils/env_config_value.py +93 -0
- nat/llm/utils/error.py +17 -0
- nat/llm/utils/thinking.py +215 -0
- nat/memory/__init__.py +20 -0
- nat/memory/interfaces.py +183 -0
- nat/memory/models.py +112 -0
- nat/meta/pypi.md +58 -0
- nat/object_store/__init__.py +20 -0
- nat/object_store/in_memory_object_store.py +76 -0
- nat/object_store/interfaces.py +84 -0
- nat/object_store/models.py +38 -0
- nat/object_store/register.py +19 -0
- nat/observability/__init__.py +14 -0
- nat/observability/exporter/__init__.py +14 -0
- nat/observability/exporter/base_exporter.py +449 -0
- nat/observability/exporter/exporter.py +78 -0
- nat/observability/exporter/file_exporter.py +33 -0
- nat/observability/exporter/processing_exporter.py +550 -0
- nat/observability/exporter/raw_exporter.py +52 -0
- nat/observability/exporter/span_exporter.py +308 -0
- nat/observability/exporter_manager.py +335 -0
- nat/observability/mixin/__init__.py +14 -0
- nat/observability/mixin/batch_config_mixin.py +26 -0
- nat/observability/mixin/collector_config_mixin.py +23 -0
- nat/observability/mixin/file_mixin.py +288 -0
- nat/observability/mixin/file_mode.py +23 -0
- nat/observability/mixin/redaction_config_mixin.py +42 -0
- nat/observability/mixin/resource_conflict_mixin.py +134 -0
- nat/observability/mixin/serialize_mixin.py +61 -0
- nat/observability/mixin/tagging_config_mixin.py +62 -0
- nat/observability/mixin/type_introspection_mixin.py +496 -0
- nat/observability/processor/__init__.py +14 -0
- nat/observability/processor/batching_processor.py +308 -0
- nat/observability/processor/callback_processor.py +42 -0
- nat/observability/processor/falsy_batch_filter_processor.py +55 -0
- nat/observability/processor/intermediate_step_serializer.py +28 -0
- nat/observability/processor/processor.py +74 -0
- nat/observability/processor/processor_factory.py +70 -0
- nat/observability/processor/redaction/__init__.py +24 -0
- nat/observability/processor/redaction/contextual_redaction_processor.py +125 -0
- nat/observability/processor/redaction/contextual_span_redaction_processor.py +66 -0
- nat/observability/processor/redaction/redaction_processor.py +177 -0
- nat/observability/processor/redaction/span_header_redaction_processor.py +92 -0
- nat/observability/processor/span_tagging_processor.py +68 -0
- nat/observability/register.py +114 -0
- nat/observability/utils/__init__.py +14 -0
- nat/observability/utils/dict_utils.py +236 -0
- nat/observability/utils/time_utils.py +31 -0
- nat/plugins/.namespace +1 -0
- nat/profiler/__init__.py +0 -0
- nat/profiler/calc/__init__.py +14 -0
- nat/profiler/calc/calc_runner.py +626 -0
- nat/profiler/calc/calculations.py +288 -0
- nat/profiler/calc/data_models.py +188 -0
- nat/profiler/calc/plot.py +345 -0
- nat/profiler/callbacks/__init__.py +0 -0
- nat/profiler/callbacks/agno_callback_handler.py +295 -0
- nat/profiler/callbacks/base_callback_class.py +20 -0
- nat/profiler/callbacks/langchain_callback_handler.py +297 -0
- nat/profiler/callbacks/llama_index_callback_handler.py +205 -0
- nat/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
- nat/profiler/callbacks/token_usage_base_model.py +27 -0
- nat/profiler/data_frame_row.py +51 -0
- nat/profiler/data_models.py +24 -0
- nat/profiler/decorators/__init__.py +0 -0
- nat/profiler/decorators/framework_wrapper.py +180 -0
- nat/profiler/decorators/function_tracking.py +411 -0
- nat/profiler/forecasting/__init__.py +0 -0
- nat/profiler/forecasting/config.py +18 -0
- nat/profiler/forecasting/model_trainer.py +75 -0
- nat/profiler/forecasting/models/__init__.py +22 -0
- nat/profiler/forecasting/models/forecasting_base_model.py +42 -0
- nat/profiler/forecasting/models/linear_model.py +197 -0
- nat/profiler/forecasting/models/random_forest_regressor.py +269 -0
- nat/profiler/inference_metrics_model.py +28 -0
- nat/profiler/inference_optimization/__init__.py +0 -0
- nat/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
- nat/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +460 -0
- nat/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
- nat/profiler/inference_optimization/data_models.py +386 -0
- nat/profiler/inference_optimization/experimental/__init__.py +0 -0
- nat/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
- nat/profiler/inference_optimization/experimental/prefix_span_analysis.py +404 -0
- nat/profiler/inference_optimization/llm_metrics.py +212 -0
- nat/profiler/inference_optimization/prompt_caching.py +163 -0
- nat/profiler/inference_optimization/token_uniqueness.py +107 -0
- nat/profiler/inference_optimization/workflow_runtimes.py +72 -0
- nat/profiler/intermediate_property_adapter.py +102 -0
- nat/profiler/parameter_optimization/__init__.py +0 -0
- nat/profiler/parameter_optimization/optimizable_utils.py +93 -0
- nat/profiler/parameter_optimization/optimizer_runtime.py +67 -0
- nat/profiler/parameter_optimization/parameter_optimizer.py +153 -0
- nat/profiler/parameter_optimization/parameter_selection.py +107 -0
- nat/profiler/parameter_optimization/pareto_visualizer.py +380 -0
- nat/profiler/parameter_optimization/prompt_optimizer.py +384 -0
- nat/profiler/parameter_optimization/update_helpers.py +66 -0
- nat/profiler/profile_runner.py +478 -0
- nat/profiler/utils.py +186 -0
- nat/registry_handlers/__init__.py +0 -0
- nat/registry_handlers/local/__init__.py +0 -0
- nat/registry_handlers/local/local_handler.py +176 -0
- nat/registry_handlers/local/register_local.py +37 -0
- nat/registry_handlers/metadata_factory.py +60 -0
- nat/registry_handlers/package_utils.py +570 -0
- nat/registry_handlers/pypi/__init__.py +0 -0
- nat/registry_handlers/pypi/pypi_handler.py +248 -0
- nat/registry_handlers/pypi/register_pypi.py +40 -0
- nat/registry_handlers/register.py +20 -0
- nat/registry_handlers/registry_handler_base.py +157 -0
- nat/registry_handlers/rest/__init__.py +0 -0
- nat/registry_handlers/rest/register_rest.py +56 -0
- nat/registry_handlers/rest/rest_handler.py +236 -0
- nat/registry_handlers/schemas/__init__.py +0 -0
- nat/registry_handlers/schemas/headers.py +42 -0
- nat/registry_handlers/schemas/package.py +68 -0
- nat/registry_handlers/schemas/publish.py +68 -0
- nat/registry_handlers/schemas/pull.py +82 -0
- nat/registry_handlers/schemas/remove.py +36 -0
- nat/registry_handlers/schemas/search.py +91 -0
- nat/registry_handlers/schemas/status.py +47 -0
- nat/retriever/__init__.py +0 -0
- nat/retriever/interface.py +41 -0
- nat/retriever/milvus/__init__.py +14 -0
- nat/retriever/milvus/register.py +81 -0
- nat/retriever/milvus/retriever.py +228 -0
- nat/retriever/models.py +77 -0
- nat/retriever/nemo_retriever/__init__.py +14 -0
- nat/retriever/nemo_retriever/register.py +60 -0
- nat/retriever/nemo_retriever/retriever.py +190 -0
- nat/retriever/register.py +21 -0
- nat/runtime/__init__.py +14 -0
- nat/runtime/loader.py +220 -0
- nat/runtime/runner.py +292 -0
- nat/runtime/session.py +223 -0
- nat/runtime/user_metadata.py +130 -0
- nat/settings/__init__.py +0 -0
- nat/settings/global_settings.py +329 -0
- nat/test/.namespace +1 -0
- nat/tool/__init__.py +0 -0
- nat/tool/chat_completion.py +77 -0
- nat/tool/code_execution/README.md +151 -0
- nat/tool/code_execution/__init__.py +0 -0
- nat/tool/code_execution/code_sandbox.py +267 -0
- nat/tool/code_execution/local_sandbox/.gitignore +1 -0
- nat/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
- nat/tool/code_execution/local_sandbox/__init__.py +13 -0
- nat/tool/code_execution/local_sandbox/local_sandbox_server.py +198 -0
- nat/tool/code_execution/local_sandbox/sandbox.requirements.txt +6 -0
- nat/tool/code_execution/local_sandbox/start_local_sandbox.sh +50 -0
- nat/tool/code_execution/register.py +74 -0
- nat/tool/code_execution/test_code_execution_sandbox.py +414 -0
- nat/tool/code_execution/utils.py +100 -0
- nat/tool/datetime_tools.py +82 -0
- nat/tool/document_search.py +141 -0
- nat/tool/github_tools.py +450 -0
- nat/tool/memory_tools/__init__.py +0 -0
- nat/tool/memory_tools/add_memory_tool.py +79 -0
- nat/tool/memory_tools/delete_memory_tool.py +66 -0
- nat/tool/memory_tools/get_memory_tool.py +72 -0
- nat/tool/nvidia_rag.py +95 -0
- nat/tool/register.py +31 -0
- nat/tool/retriever.py +95 -0
- nat/tool/server_tools.py +66 -0
- nat/utils/__init__.py +0 -0
- nat/utils/callable_utils.py +70 -0
- nat/utils/data_models/__init__.py +0 -0
- nat/utils/data_models/schema_validator.py +58 -0
- nat/utils/debugging_utils.py +43 -0
- nat/utils/decorators.py +210 -0
- nat/utils/dump_distro_mapping.py +32 -0
- nat/utils/exception_handlers/__init__.py +0 -0
- nat/utils/exception_handlers/automatic_retries.py +342 -0
- nat/utils/exception_handlers/schemas.py +114 -0
- nat/utils/io/__init__.py +0 -0
- nat/utils/io/model_processing.py +28 -0
- nat/utils/io/yaml_tools.py +119 -0
- nat/utils/log_levels.py +25 -0
- nat/utils/log_utils.py +37 -0
- nat/utils/metadata_utils.py +74 -0
- nat/utils/optional_imports.py +142 -0
- nat/utils/producer_consumer_queue.py +178 -0
- nat/utils/reactive/__init__.py +0 -0
- nat/utils/reactive/base/__init__.py +0 -0
- nat/utils/reactive/base/observable_base.py +65 -0
- nat/utils/reactive/base/observer_base.py +55 -0
- nat/utils/reactive/base/subject_base.py +79 -0
- nat/utils/reactive/observable.py +59 -0
- nat/utils/reactive/observer.py +76 -0
- nat/utils/reactive/subject.py +131 -0
- nat/utils/reactive/subscription.py +49 -0
- nat/utils/settings/__init__.py +0 -0
- nat/utils/settings/global_settings.py +195 -0
- nat/utils/string_utils.py +38 -0
- nat/utils/type_converter.py +299 -0
- nat/utils/type_utils.py +488 -0
- nat/utils/url_utils.py +27 -0
- nvidia_nat-1.1.0a20251020.dist-info/METADATA +195 -0
- nvidia_nat-1.1.0a20251020.dist-info/RECORD +480 -0
- nvidia_nat-1.1.0a20251020.dist-info/WHEEL +5 -0
- nvidia_nat-1.1.0a20251020.dist-info/entry_points.txt +22 -0
- nvidia_nat-1.1.0a20251020.dist-info/licenses/LICENSE-3rd-party.txt +5478 -0
- nvidia_nat-1.1.0a20251020.dist-info/licenses/LICENSE.md +201 -0
- nvidia_nat-1.1.0a20251020.dist-info/top_level.txt +2 -0
|
@@ -0,0 +1,107 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
# System prompt for the ReWOO planner stage.
#
# Placeholders filled in when the template is rendered: `{tools}` and `{tool_names}`.
# Literal braces in the JSON example are doubled (`{{` / `}}`) so that format-style rendering
# emits single braces. The example is deliberately kept strictly valid JSON (no wrapping quotes
# around objects, arrays instead of tuples) because the prompt instructs the model to emit a JSON
# array "that can be parsed directly".
PLANNER_SYSTEM_PROMPT = """
For the following task, make plans that can solve the problem step by step. For each plan, indicate \
which external tool together with tool input to retrieve evidence. You can store the evidence into a \
placeholder #E that can be called by later tools. (Plan, #E1, Plan, #E2, Plan, ...)

The following tools and respective requirements are available to you:

{tools}

The tool calls you make should be one of the following: [{tool_names}]

You are not required to use all the tools listed. Choose only the ones that best fit the needs of each plan step.

Your output must be a JSON array where each element represents one planning step. Each step must be an object with \
exactly two keys:

1. "plan": A string that describes in detail the action or reasoning for that step.

2. "evidence": An object representing the external tool call associated with that plan step. This object must have the \
following keys:

-"placeholder": A string that identifies the evidence placeholder ("#E1", "#E2", ...). The numbering should \
be sequential based on the order of steps.

-"tool": A string specifying the name of the external tool used.

-"tool_input": The input to the tool. This can be a string, array, or object, depending on the requirements of the \
tool. Be careful about type assumptions because the output of former tools might contain noise.

Important instructions:

Do not output any additional text, comments, or markdown formatting.

Do not include any explanation or reasoning text outside of the JSON array.

The output must be a valid JSON array that can be parsed directly.

Here is an example of how a valid JSON output should look:

[
  {{
    "plan": "Find Alex's schedule on Sep 25, 2025",
    "evidence": {{
      "placeholder": "#E1",
      "tool": "search_calendar",
      "tool_input": ["Alex", "09/25/2025"]
    }}
  }},
  {{
    "plan": "Find Bill's schedule on Sep 25, 2025",
    "evidence": {{
      "placeholder": "#E2",
      "tool": "search_calendar",
      "tool_input": ["Bill", "09/25/2025"]
    }}
  }},
  {{
    "plan": "Suggest a time for 1-hour meeting given Alex's and Bill's schedule.",
    "evidence": {{
      "placeholder": "#E3",
      "tool": "llm_chat",
      "tool_input": "Find a common 1-hour time slot for Alex and Bill given their schedules. \
Alex's schedule: #E1; Bill's schedule: #E2?"
    }}
  }}
]

Begin!
"""
|
|
85
|
+
|
|
86
|
+
PLANNER_USER_PROMPT = """
|
|
87
|
+
Previous conversation history:
|
|
88
|
+
{chat_history}
|
|
89
|
+
|
|
90
|
+
task: {task}
|
|
91
|
+
"""
|
|
92
|
+
|
|
93
|
+
SOLVER_SYSTEM_PROMPT = """
|
|
94
|
+
Solve the following task or problem. To solve the problem, we have made some Plans ahead and \
|
|
95
|
+
retrieved corresponding Evidence to each Plan. Use them with caution since long evidence might \
|
|
96
|
+
contain irrelevant information.
|
|
97
|
+
|
|
98
|
+
Now solve the question or task according to provided Evidence above. Respond with the answer
|
|
99
|
+
directly with no extra words.
|
|
100
|
+
|
|
101
|
+
"""
|
|
102
|
+
SOLVER_USER_PROMPT = """
|
|
103
|
+
plan: {plan}
|
|
104
|
+
task: {task}
|
|
105
|
+
|
|
106
|
+
Response:
|
|
107
|
+
"""
|
|
@@ -0,0 +1,175 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
|
|
18
|
+
from pydantic import AliasChoices
|
|
19
|
+
from pydantic import Field
|
|
20
|
+
from pydantic import PositiveInt
|
|
21
|
+
|
|
22
|
+
from nat.builder.builder import Builder
|
|
23
|
+
from nat.builder.framework_enum import LLMFrameworkEnum
|
|
24
|
+
from nat.builder.function_info import FunctionInfo
|
|
25
|
+
from nat.cli.register_workflow import register_function
|
|
26
|
+
from nat.data_models.agent import AgentBaseConfig
|
|
27
|
+
from nat.data_models.api_server import ChatRequest
|
|
28
|
+
from nat.data_models.api_server import ChatRequestOrMessage
|
|
29
|
+
from nat.data_models.api_server import ChatResponse
|
|
30
|
+
from nat.data_models.api_server import Usage
|
|
31
|
+
from nat.data_models.component_ref import FunctionGroupRef
|
|
32
|
+
from nat.data_models.component_ref import FunctionRef
|
|
33
|
+
from nat.utils.type_converter import GlobalTypeConverter
|
|
34
|
+
|
|
35
|
+
# Module-level logger, named after this module.
logger = logging.getLogger(__name__)
|
|
36
|
+
|
|
37
|
+
|
|
38
|
+
class ReWOOAgentWorkflowConfig(AgentBaseConfig, name="rewoo_agent"):
    """
    Configuration for the NAT function registered under the name ``rewoo_agent``.

    The fields select the tools offered to the ReWOO agent, optionally override or extend the planner and
    solver system prompts, and control tool-call retries, tool-error propagation and the amount of
    conversation history that is kept.
    """
    description: str = Field(default="ReWOO Agent Workflow", description="The description of this functions use.")
    tool_names: list[FunctionRef | FunctionGroupRef] = Field(
        default_factory=list, description="The list of tools to provide to the rewoo agent.")
    include_tool_input_schema_in_tool_description: bool = Field(
        default=True, description="Specify inclusion of tool input schemas in the prompt.")
    # When left as None, PLANNER_SYSTEM_PROMPT from prompt.py is used.
    planner_prompt: str | None = Field(default=None, description="Provides the PLANNER_PROMPT to use with the agent")
    # When left as None, SOLVER_SYSTEM_PROMPT from prompt.py is used.
    solver_prompt: str | None = Field(default=None, description="Provides the SOLVER_PROMPT to use with the agent")
    tool_call_max_retries: PositiveInt = Field(default=3,
                                               description="The number of retries before raising a tool call error.",
                                               ge=1)
    max_history: int = Field(default=15, description="Maximum number of messages to keep in the conversation history.")
    # Also accepted under the key "additional_instructions" (see the validation alias).
    additional_planner_instructions: str | None = Field(
        default=None,
        validation_alias=AliasChoices("additional_planner_instructions", "additional_instructions"),
        description="Additional instructions to provide to the agent in addition to the base planner prompt.")
    additional_solver_instructions: str | None = Field(
        default=None,
        description="Additional instructions to provide to the agent in addition to the base solver prompt.")
    # The adjacent string literals are concatenated verbatim, so each fragment must carry its own
    # trailing space; without it the description reads "toolcall" / "inthe".
    raise_tool_call_error: bool = Field(default=True,
                                        description="Whether to raise an exception immediately if a tool "
                                        "call fails. If set to False, the tool call error message will be included in "
                                        "the tool response and passed to the next tool.")
|
|
69
|
+
|
|
70
|
+
|
|
71
|
+
@register_function(config_type=ReWOOAgentWorkflowConfig, framework_wrappers=[LLMFrameworkEnum.LANGCHAIN])
async def rewoo_agent_workflow(config: ReWOOAgentWorkflowConfig, builder: Builder):
    """
    Build the ReWOO Agent workflow and yield it wrapped as a function.

    The planner and solver prompts are assembled and validated, the configured LLM and tools are fetched from the
    builder, the ReWOO Agent Graph is compiled, and a chat entry point that drives the graph is yielded.

    Args:
        config (ReWOOAgentWorkflowConfig): ReWOO Agent settings (prompts, tools, retry and history limits).
        builder (Builder): Used to look up the configured LLM and tools.

    Yields:
        FunctionInfo: Wraps the ReWOO Agent entry point, described by ``config.description``.

    Raises:
        ValueError: If the planner or solver prompt fails validation, or if no tools were resolved.
    """
    from langchain_core.messages import trim_messages
    from langchain_core.messages.base import BaseMessage
    from langchain_core.messages.human import HumanMessage
    from langchain_core.prompts import ChatPromptTemplate
    from langgraph.graph.state import CompiledStateGraph

    from nat.agent.rewoo_agent.prompt import PLANNER_SYSTEM_PROMPT
    from nat.agent.rewoo_agent.prompt import PLANNER_USER_PROMPT
    from nat.agent.rewoo_agent.prompt import SOLVER_SYSTEM_PROMPT
    from nat.agent.rewoo_agent.prompt import SOLVER_USER_PROMPT

    from .agent import ReWOOAgentGraph
    from .agent import ReWOOGraphState

    # Planner prompt: a prompt supplied in the config replaces the default from prompt.py; any additional
    # instructions are appended directly (no separator is inserted) before the result is validated.
    planner_text = config.planner_prompt if config.planner_prompt is not None else PLANNER_SYSTEM_PROMPT
    if config.additional_planner_instructions:
        planner_text = f"{planner_text}{config.additional_planner_instructions}"
    if not ReWOOAgentGraph.validate_planner_prompt(planner_text):
        logger.error("Invalid planner prompt")
        raise ValueError("Invalid planner prompt")
    planner_prompt = ChatPromptTemplate([("system", planner_text), ("user", PLANNER_USER_PROMPT)])

    # Solver prompt: assembled and validated the same way as the planner prompt.
    solver_text = config.solver_prompt if config.solver_prompt is not None else SOLVER_SYSTEM_PROMPT
    if config.additional_solver_instructions:
        solver_text = f"{solver_text}{config.additional_solver_instructions}"
    if not ReWOOAgentGraph.validate_solver_prompt(solver_text):
        logger.error("Invalid solver prompt")
        raise ValueError("Invalid solver prompt")
    solver_prompt = ChatPromptTemplate([("system", solver_text), ("user", SOLVER_USER_PROMPT)])

    # The LLM driving the agent is selected by name in the config file.
    llm = await builder.get_llm(config.llm_name, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    # Tools are likewise listed by name in the config file; the agent cannot run without at least one.
    tools = await builder.get_tools(tool_names=config.tool_names, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
    if not tools:
        raise ValueError(f"No tools specified for ReWOO Agent '{config.llm_name}'")

    # Assemble the agent from the LLM, prompts and tools, then compile its graph.
    rewoo_agent = ReWOOAgentGraph(
        llm=llm,
        planner_prompt=planner_prompt,
        solver_prompt=solver_prompt,
        tools=tools,
        use_tool_schema=config.include_tool_input_schema_in_tool_description,
        detailed_logs=config.verbose,
        log_response_max_chars=config.log_response_max_chars,
        tool_call_max_retries=config.tool_call_max_retries,
        raise_tool_call_error=config.raise_tool_call_error,
    )
    graph: CompiledStateGraph = await rewoo_agent.build_graph()

    async def _response_fn(chat_request_or_message: ChatRequestOrMessage) -> ChatResponse | str:
        """
        Entry point of the ReWOO Agent workflow.

        Converts the input to a chat request, runs the ReWOO Agent Graph on the trimmed message history and
        packages the graph result as a response.

        Args:
            chat_request_or_message (ChatRequestOrMessage): The input message to process

        Returns:
            ChatResponse | str: The agent response; converted to a string when the input was a plain string.
            Failures are logged and re-raised rather than returned.
        """
        try:
            chat_request = GlobalTypeConverter.get().convert(chat_request_or_message, to_type=ChatRequest)

            # With token_counter=len the trim budget is counted in messages, so at most max_history
            # messages are kept, starting on a human message.
            dumped_messages = [m.model_dump() for m in chat_request.messages]
            history: list[BaseMessage] = trim_messages(messages=dumped_messages,
                                                       max_tokens=config.max_history,
                                                       strategy="last",
                                                       token_counter=len,
                                                       start_on="human",
                                                       include_system=True)

            # The task handed to the planner is the content of the most recent retained message.
            task = HumanMessage(content=history[-1].content)
            initial_state = ReWOOGraphState(messages=history, task=task)

            # Run the graph, then rebuild a typed state from the raw output it returns.
            raw_state = await graph.ainvoke(initial_state)
            final_state = ReWOOGraphState(**raw_state)

            # Structured content (list or dict) is flattened to its string form.
            answer = final_state.result.content
            if isinstance(answer, (list, dict)):
                answer = str(answer)

            # Usage figures are whitespace-delimited word counts, not tokenizer counts.
            prompt_tokens = sum(len(str(msg.content).split()) for msg in chat_request.messages)
            completion_tokens = len(answer.split()) if answer else 0
            usage = Usage(prompt_tokens=prompt_tokens,
                          completion_tokens=completion_tokens,
                          total_tokens=prompt_tokens + completion_tokens)

            response = ChatResponse.from_string(answer, usage=usage)
            if not chat_request_or_message.is_string:
                return response
            return GlobalTypeConverter.get().convert(response, to_type=str)
        except Exception as ex:
            logger.error("ReWOO Agent failed with exception: %s", ex)
            raise

    yield FunctionInfo.from_fn(_response_fn, description=config.description)
|
|
File without changes
|
|
@@ -0,0 +1,246 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
import typing
|
|
18
|
+
|
|
19
|
+
from langchain_core.callbacks.base import AsyncCallbackHandler
|
|
20
|
+
from langchain_core.language_models import BaseChatModel
|
|
21
|
+
from langchain_core.messages import SystemMessage
|
|
22
|
+
from langchain_core.messages import ToolMessage
|
|
23
|
+
from langchain_core.messages.base import BaseMessage
|
|
24
|
+
from langchain_core.runnables import RunnableLambda
|
|
25
|
+
from langchain_core.runnables.config import RunnableConfig
|
|
26
|
+
from langchain_core.tools import BaseTool
|
|
27
|
+
from langgraph.graph import StateGraph
|
|
28
|
+
from langgraph.graph.state import CompiledStateGraph
|
|
29
|
+
from langgraph.prebuilt import ToolNode
|
|
30
|
+
from pydantic import BaseModel
|
|
31
|
+
from pydantic import Field
|
|
32
|
+
|
|
33
|
+
from nat.agent.base import AGENT_CALL_LOG_MESSAGE
|
|
34
|
+
from nat.agent.base import AGENT_LOG_PREFIX
|
|
35
|
+
from nat.agent.base import AgentDecision
|
|
36
|
+
from nat.agent.dual_node import DualNodeAgent
|
|
37
|
+
|
|
38
|
+
if typing.TYPE_CHECKING:
|
|
39
|
+
from nat.agent.tool_calling_agent.register import ToolCallAgentWorkflowConfig
|
|
40
|
+
|
|
41
|
+
logger = logging.getLogger(__name__)
|
|
42
|
+
|
|
43
|
+
|
|
44
|
+
class ToolCallAgentGraphState(BaseModel):
    """Graph state of the Tool Calling Agent: the running list of conversation messages."""

    # Carries both the input to the agent and the output it produces; each instance starts with its own
    # empty list.
    messages: list[BaseMessage] = Field(default_factory=list)
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
class ToolCallAgentGraph(DualNodeAgent):
    """LangGraph Tool Calling Agent with a configurable prompt, tool set and error handling.

    The agent needs an LLM that supports tool calling: the tools are bound to the LLM so it can pick a tool from
    the tools' input parameters. Tool errors can optionally be handled by the tool node, and selected tools can
    be marked to return their output directly. The ``detailed_logs`` argument toggles logging of inputs, outputs
    and intermediate steps.
    """

    def __init__(
        self,
        llm: BaseChatModel,
        tools: list[BaseTool],
        prompt: str | None = None,
        callbacks: list[AsyncCallbackHandler] = None,
        detailed_logs: bool = False,
        log_response_max_chars: int = 1000,
        handle_tool_errors: bool = True,
        return_direct: list[BaseTool] | None = None,
    ):
        """
        Bind the tools to the LLM and prepare the agent and tool runnables.

        Args:
            llm (BaseChatModel): Chat model; must implement ``bind_tools``.
            tools (list[BaseTool]): Tools bound to the LLM and executed by the tool node.
            prompt (str | None): Optional system prompt placed in front of the conversation messages.
            callbacks (list[AsyncCallbackHandler]): Callbacks passed to every agent and tool invocation.
            detailed_logs (bool): Whether to log inputs, outputs and intermediate steps.
            log_response_max_chars (int): Forwarded to the base class.
            handle_tool_errors (bool): Forwarded to the ``ToolNode``.
            return_direct (list[BaseTool] | None): Tools whose response ends the graph without a further LLM call.

        Raises:
            NotImplementedError: If the LLM does not support binding tools.
        """
        super().__init__(
            llm=llm,
            tools=tools,
            callbacks=callbacks,
            detailed_logs=detailed_logs,
            log_response_max_chars=log_response_max_chars,
        )

        # Binding hands the tools' input schemas to the LLM at runtime, so the model itself decides when a
        # tool is relevant. Only LLMs with tool-calling support implement this.
        try:
            self.bound_llm = llm.bind_tools(tools)
        except NotImplementedError as ex:
            logger.error("%s Failed to bind tools: %s", AGENT_LOG_PREFIX, ex)
            raise

        if prompt is None:
            # no system prompt: hand the conversation to the LLM unchanged
            prompt_runnable = RunnableLambda(
                lambda state: state.get("messages", []),
                name="PromptPassthrough",
            )
        else:
            # put the system prompt in front of the conversation on every call
            system_prompt = SystemMessage(content=prompt)
            prompt_runnable = RunnableLambda(
                lambda state: [system_prompt] + state.get("messages", []),
                name="SystemPrompt",
            )

        self.agent = prompt_runnable | self.bound_llm
        self.tool_caller = ToolNode(tools, handle_tool_errors=handle_tool_errors)
        # only the tool names are needed later, for matching against ToolMessage.name
        self.return_direct = [tool.name for tool in (return_direct or [])]
        logger.debug("%s Initialized Tool Calling Agent Graph", AGENT_LOG_PREFIX)

    async def agent_node(self, state: ToolCallAgentGraphState):
        """
        Invoke the LLM on the current messages and append its response to the state.

        Raises:
            RuntimeError: If the state holds no messages.
        """
        try:
            logger.debug("%s Starting the Tool Calling Agent Node", AGENT_LOG_PREFIX)
            if not state.messages:
                raise RuntimeError('No input received in state: "messages"')

            run_config = RunnableConfig(callbacks=self.callbacks)
            response = await self.agent.ainvoke({"messages": state.messages}, config=run_config)

            if self.detailed_logs:
                agent_input = "\n".join(str(message.content) for message in state.messages)
                logger.info(AGENT_CALL_LOG_MESSAGE, agent_input, response)

            state.messages += [response]
            return state
        except Exception as ex:
            logger.error("%s Failed to call agent_node: %s", AGENT_LOG_PREFIX, ex)
            raise

    async def conditional_edge(self, state: ToolCallAgentGraphState):
        """
        Route after the agent node: TOOL when the last message requests tool calls, END otherwise.

        Any failure while deciding is logged and ends graph traversal (END) instead of being raised.
        """
        try:
            logger.debug("%s Starting the Tool Calling Conditional Edge", AGENT_LOG_PREFIX)
            last_message = state.messages[-1]

            if not last_message.tool_calls:
                # no tool requested: the last message is the final answer
                if self.detailed_logs:
                    logger.debug("%s Final answer:\n%s", AGENT_LOG_PREFIX, last_message.content)
                return AgentDecision.END

            # the agent wants to call a tool
            logger.debug("%s Agent is calling a tool", AGENT_LOG_PREFIX)
            return AgentDecision.TOOL
        except Exception as ex:
            logger.exception("%s Failed to determine whether agent is calling a tool: %s", AGENT_LOG_PREFIX, ex)
            logger.warning("%s Ending graph traversal", AGENT_LOG_PREFIX)
            return AgentDecision.END

    async def tool_node(self, state: ToolCallAgentGraphState):
        """Execute the tool calls requested by the last message and append every tool response to the state."""
        try:
            logger.debug("%s Starting Tool Node", AGENT_LOG_PREFIX)
            tool_input = state.messages[-1]
            tools = [tool.get("name") for tool in tool_input.tool_calls]

            # Per the original author's note, the empty `configurable` dict works around a bug in the
            # LangGraph prebuilt ToolNode.
            run_config = RunnableConfig(callbacks=self.callbacks, configurable={})
            tool_response = await self.tool_caller.ainvoke(input={"messages": [tool_input]}, config=run_config)

            for response in tool_response.get("messages"):
                if self.detailed_logs:
                    self._log_tool_response(str(tools), str(tool_input), response.content)
                state.messages += [response]

            return state
        except Exception as ex:
            logger.error("%s Failed to call tool_node: %s", AGENT_LOG_PREFIX, ex)
            raise

    async def tool_conditional_edge(self, state: ToolCallAgentGraphState) -> AgentDecision:
        """
        Route after the tool node: back to the agent, or straight to the end of the graph.

        Args:
            state: The current state of the Tool Calling Agent graph containing messages and tool responses.

        Returns:
            AgentDecision: END when the last message is a ToolMessage whose tool name is in the return_direct
                list; TOOL (continue to the agent) in every other case, including an empty state and any
                failure while deciding.
        """
        try:
            logger.debug("%s Starting the Tool Conditional Edge", AGENT_LOG_PREFIX)
            if not state.messages:
                logger.debug("%s No messages in state; routing to agent", AGENT_LOG_PREFIX)
                return AgentDecision.TOOL

            last_message = state.messages[-1]
            # Anything other than a named tool response from a return_direct tool goes back to the agent.
            back_to_agent = (not self.return_direct or not isinstance(last_message, ToolMessage)
                             or not last_message.name or last_message.name not in self.return_direct)
            if back_to_agent:
                logger.debug("%s Tool response will be processed by agent", AGENT_LOG_PREFIX)
                return AgentDecision.TOOL

            logger.debug("%s Tool %s is set to return directly", AGENT_LOG_PREFIX, last_message.name)
            return AgentDecision.END
        except Exception as ex:
            logger.exception("%s Failed to determine tool conditional edge: %s", AGENT_LOG_PREFIX, ex)
            logger.warning("%s Continuing to agent for processing", AGENT_LOG_PREFIX)
            return AgentDecision.TOOL

    async def _build_graph(self, state_schema: type) -> CompiledStateGraph:
        """Wire the agent and tool nodes into a StateGraph, compile it, store it on ``self.graph`` and return it."""
        try:
            logger.debug("%s Building and compiling the Tool Calling Agent Graph", AGENT_LOG_PREFIX)

            graph = StateGraph(state_schema)
            graph.add_node("agent", self.agent_node)
            graph.add_node("tool", self.tool_node)

            if not self.return_direct:
                # no return_direct tools: always hand the tool output back to the agent
                graph.add_edge("tool", "agent")
            else:
                # a return_direct tool may finish the graph right after the tool call
                graph.add_conditional_edges(
                    "tool",
                    self.tool_conditional_edge,
                    {
                        AgentDecision.END: "__end__", AgentDecision.TOOL: "agent"
                    },
                )

            # after the agent: run the requested tool, or finish with the final answer
            graph.add_conditional_edges(
                "agent",
                self.conditional_edge,
                {
                    AgentDecision.TOOL: "tool", AgentDecision.END: "__end__"
                },
            )

            graph.set_entry_point("agent")
            self.graph = graph.compile()

            return self.graph
        except Exception as ex:
            logger.error("%s Failed to build Tool Calling Agent Graph: %s", AGENT_LOG_PREFIX, ex)
            raise

    async def build_graph(self) -> CompiledStateGraph:
        """Build and compile the graph using ``ToolCallAgentGraphState`` as the state schema, and return it."""
        try:
            await self._build_graph(state_schema=ToolCallAgentGraphState)
            logger.debug("%s Tool Calling Agent Graph built and compiled successfully", AGENT_LOG_PREFIX)
            return self.graph
        except Exception as ex:
            logger.error("%s Failed to build Tool Calling Agent Graph: %s", AGENT_LOG_PREFIX, ex)
            raise
|
|
222
|
+
|
|
223
|
+
|
|
224
|
+
def create_tool_calling_agent_prompt(config: "ToolCallAgentWorkflowConfig") -> str | None:
|
|
225
|
+
"""
|
|
226
|
+
Create a Tool Calling Agent prompt from the config.
|
|
227
|
+
|
|
228
|
+
Args:
|
|
229
|
+
config (ToolCallAgentWorkflowConfig): The config to use for the prompt.
|
|
230
|
+
|
|
231
|
+
Returns:
|
|
232
|
+
ChatPromptTemplate: The Tool Calling Agent prompt.
|
|
233
|
+
"""
|
|
234
|
+
# the Tool Calling Agent prompt can be customized via config option system_prompt and additional_instructions.
|
|
235
|
+
|
|
236
|
+
if config.system_prompt:
|
|
237
|
+
prompt_str = config.system_prompt
|
|
238
|
+
else:
|
|
239
|
+
prompt_str = ""
|
|
240
|
+
|
|
241
|
+
if config.additional_instructions:
|
|
242
|
+
prompt_str += f" {config.additional_instructions}"
|
|
243
|
+
|
|
244
|
+
if len(prompt_str) > 0:
|
|
245
|
+
return prompt_str
|
|
246
|
+
return None
|
|
@@ -0,0 +1,129 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
|
|
18
|
+
from pydantic import Field
|
|
19
|
+
|
|
20
|
+
from nat.builder.builder import Builder
|
|
21
|
+
from nat.builder.framework_enum import LLMFrameworkEnum
|
|
22
|
+
from nat.builder.function_info import FunctionInfo
|
|
23
|
+
from nat.cli.register_workflow import register_function
|
|
24
|
+
from nat.data_models.agent import AgentBaseConfig
|
|
25
|
+
from nat.data_models.api_server import ChatRequest
|
|
26
|
+
from nat.data_models.api_server import ChatRequestOrMessage
|
|
27
|
+
from nat.data_models.component_ref import FunctionGroupRef
|
|
28
|
+
from nat.data_models.component_ref import FunctionRef
|
|
29
|
+
from nat.utils.type_converter import GlobalTypeConverter
|
|
30
|
+
|
|
31
|
+
logger = logging.getLogger(__name__)
|
|
32
|
+
|
|
33
|
+
|
|
34
|
+
class ToolCallAgentWorkflowConfig(AgentBaseConfig, name="tool_calling_agent"):
    """
    A Tool Calling Agent requires an LLM which supports tool calling. A tool Calling Agent utilizes the tool
    input parameters to select the optimal tool. Supports handling tool errors.
    """
    # NOTE(review): the docstring and the Field descriptions are kept verbatim (typos included) since they
    # are runtime text, presumably surfaced in generated schemas/help output - confirm before rewording.

    # --- general -------------------------------------------------------------------------------------------
    description: str = Field(
        default="Tool Calling Agent Workflow",
        description="Description of this functions use.",
    )

    # --- tools ---------------------------------------------------------------------------------------------
    tool_names: list[FunctionRef | FunctionGroupRef] = Field(
        default_factory=list,
        description="The list of tools to provide to the tool calling agent.",
    )
    handle_tool_errors: bool = Field(
        default=True,
        description="Specify ability to handle tool calling errors.",
    )

    # --- limits --------------------------------------------------------------------------------------------
    max_iterations: int = Field(
        default=15,
        description="Number of tool calls before stoping the tool calling agent.",
    )
    max_history: int = Field(
        default=15,
        description="Maximum number of messages to keep in the conversation history.",
    )

    # --- prompt --------------------------------------------------------------------------------------------
    system_prompt: str | None = Field(
        default=None,
        description="Provides the system prompt to use with the agent.",
    )
    additional_instructions: str | None = Field(
        default=None,
        description="Additional instructions appended to the system prompt.",
    )

    # --- routing -------------------------------------------------------------------------------------------
    return_direct: list[FunctionRef] | None = Field(
        default=None,
        description="List of tool names that should return responses directly without LLM processing.",
    )
|
|
51
|
+
|
|
52
|
+
|
|
53
|
+
@register_function(config_type=ToolCallAgentWorkflowConfig, framework_wrappers=[LLMFrameworkEnum.LANGCHAIN])
async def tool_calling_agent_workflow(config: ToolCallAgentWorkflowConfig, builder: Builder):
    """
    Build the Tool Calling Agent workflow and yield it wrapped as a function.

    The system prompt is assembled from the config, the configured LLM and tools are fetched from the builder,
    the Tool Calling Agent Graph is compiled, and a chat entry point that drives the graph is yielded.

    Args:
        config (ToolCallAgentWorkflowConfig): Tool Calling Agent settings (prompt, tools, iteration and
            history limits).
        builder (Builder): Used to look up the configured LLM and tools.

    Yields:
        FunctionInfo: Wraps the Tool Calling Agent entry point, described by ``config.description``.

    Raises:
        ValueError: If no tools were resolved from ``config.tool_names``.
    """
    from langchain_core.messages import trim_messages
    from langchain_core.messages.base import BaseMessage
    from langgraph.graph.state import CompiledStateGraph

    from nat.agent.base import AGENT_LOG_PREFIX
    from nat.agent.tool_calling_agent.agent import ToolCallAgentGraph
    from nat.agent.tool_calling_agent.agent import ToolCallAgentGraphState
    from nat.agent.tool_calling_agent.agent import create_tool_calling_agent_prompt

    prompt = create_tool_calling_agent_prompt(config)
    # we can choose an LLM for the Tool Calling Agent in the config file
    llm = await builder.get_llm(config.llm_name, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
    # the agent can run any installed tool, simply install the tool and add it to the config file
    # the sample tools provided can easily be copied or changed
    tools = await builder.get_tools(tool_names=config.tool_names, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
    if not tools:
        raise ValueError(f"No tools specified for Tool Calling Agent '{config.llm_name}'")

    # convert return_direct FunctionRef objects to BaseTool objects
    return_direct_tools = await builder.get_tools(
        tool_names=config.return_direct, wrapper_type=LLMFrameworkEnum.LANGCHAIN) if config.return_direct else None

    # construct the Tool Calling Agent Graph from the configured llm, and tools
    graph: CompiledStateGraph = await ToolCallAgentGraph(llm=llm,
                                                         tools=tools,
                                                         prompt=prompt,
                                                         detailed_logs=config.verbose,
                                                         log_response_max_chars=config.log_response_max_chars,
                                                         handle_tool_errors=config.handle_tool_errors,
                                                         return_direct=return_direct_tools).build_graph()

    async def _response_fn(chat_request_or_message: ChatRequestOrMessage) -> str:
        """
        Main workflow entry function for the Tool Calling Agent.

        This function invokes the Tool Calling Agent Graph and returns the response.

        Args:
            chat_request_or_message (ChatRequestOrMessage): The input message to process

        Returns:
            str: The content of the last message produced by the agent graph, as a string. Failures are
            logged and re-raised rather than returned.
        """
        try:
            message = GlobalTypeConverter.get().convert(chat_request_or_message, to_type=ChatRequest)

            # initialize the starting state with the user query
            # with token_counter=len the trim budget is counted in messages, so at most max_history
            # messages are kept, starting on a human message
            messages: list[BaseMessage] = trim_messages(messages=[m.model_dump() for m in message.messages],
                                                        max_tokens=config.max_history,
                                                        strategy="last",
                                                        token_counter=len,
                                                        start_on="human",
                                                        include_system=True)
            state = ToolCallAgentGraphState(messages=messages)

            # run the Tool Calling Agent Graph
            state = await graph.ainvoke(state, config={'recursion_limit': (config.max_iterations + 1) * 2})
            # setting recursion_limit: 4 (i.e. max_iterations = 1) allows 1 tool call
            #   - allows the Tool Calling Agent to perform 1 cycle / call 1 single tool,
            #   - but stops the agent when it tries to call a tool a second time

            # get and return the output from the state
            state = ToolCallAgentGraphState(**state)
            output_message = state.messages[-1]
            return str(output_message.content)
        except Exception as ex:
            logger.error("%s Tool Calling Agent failed with exception: %s", AGENT_LOG_PREFIX, ex)
            raise

    try:
        yield FunctionInfo.from_fn(_response_fn, description=config.description)
    except GeneratorExit:
        logger.exception("%s Workflow exited early!", AGENT_LOG_PREFIX)
    finally:
        # fixed copy-paste: this message used to name the react_agent workflow
        logger.debug("%s Cleaning up tool_calling_agent workflow.", AGENT_LOG_PREFIX)
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|