nvidia-nat 1.1.0a20251020__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- aiq/__init__.py +66 -0
- nat/agent/__init__.py +0 -0
- nat/agent/base.py +265 -0
- nat/agent/dual_node.py +72 -0
- nat/agent/prompt_optimizer/__init__.py +0 -0
- nat/agent/prompt_optimizer/prompt.py +68 -0
- nat/agent/prompt_optimizer/register.py +149 -0
- nat/agent/react_agent/__init__.py +0 -0
- nat/agent/react_agent/agent.py +394 -0
- nat/agent/react_agent/output_parser.py +104 -0
- nat/agent/react_agent/prompt.py +44 -0
- nat/agent/react_agent/register.py +168 -0
- nat/agent/reasoning_agent/__init__.py +0 -0
- nat/agent/reasoning_agent/reasoning_agent.py +227 -0
- nat/agent/register.py +23 -0
- nat/agent/rewoo_agent/__init__.py +0 -0
- nat/agent/rewoo_agent/agent.py +593 -0
- nat/agent/rewoo_agent/prompt.py +107 -0
- nat/agent/rewoo_agent/register.py +175 -0
- nat/agent/tool_calling_agent/__init__.py +0 -0
- nat/agent/tool_calling_agent/agent.py +246 -0
- nat/agent/tool_calling_agent/register.py +129 -0
- nat/authentication/__init__.py +14 -0
- nat/authentication/api_key/__init__.py +14 -0
- nat/authentication/api_key/api_key_auth_provider.py +96 -0
- nat/authentication/api_key/api_key_auth_provider_config.py +124 -0
- nat/authentication/api_key/register.py +26 -0
- nat/authentication/credential_validator/__init__.py +14 -0
- nat/authentication/credential_validator/bearer_token_validator.py +557 -0
- nat/authentication/exceptions/__init__.py +14 -0
- nat/authentication/exceptions/api_key_exceptions.py +38 -0
- nat/authentication/http_basic_auth/__init__.py +0 -0
- nat/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
- nat/authentication/http_basic_auth/register.py +30 -0
- nat/authentication/interfaces.py +96 -0
- nat/authentication/oauth2/__init__.py +14 -0
- nat/authentication/oauth2/oauth2_auth_code_flow_provider.py +140 -0
- nat/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
- nat/authentication/oauth2/oauth2_resource_server_config.py +124 -0
- nat/authentication/oauth2/register.py +25 -0
- nat/authentication/register.py +20 -0
- nat/builder/__init__.py +0 -0
- nat/builder/builder.py +317 -0
- nat/builder/component_utils.py +320 -0
- nat/builder/context.py +321 -0
- nat/builder/embedder.py +24 -0
- nat/builder/eval_builder.py +166 -0
- nat/builder/evaluator.py +29 -0
- nat/builder/framework_enum.py +25 -0
- nat/builder/front_end.py +73 -0
- nat/builder/function.py +714 -0
- nat/builder/function_base.py +380 -0
- nat/builder/function_info.py +625 -0
- nat/builder/intermediate_step_manager.py +206 -0
- nat/builder/llm.py +25 -0
- nat/builder/retriever.py +25 -0
- nat/builder/user_interaction_manager.py +78 -0
- nat/builder/workflow.py +160 -0
- nat/builder/workflow_builder.py +1365 -0
- nat/cli/__init__.py +14 -0
- nat/cli/cli_utils/__init__.py +0 -0
- nat/cli/cli_utils/config_override.py +231 -0
- nat/cli/cli_utils/validation.py +37 -0
- nat/cli/commands/__init__.py +0 -0
- nat/cli/commands/configure/__init__.py +0 -0
- nat/cli/commands/configure/channel/__init__.py +0 -0
- nat/cli/commands/configure/channel/add.py +28 -0
- nat/cli/commands/configure/channel/channel.py +34 -0
- nat/cli/commands/configure/channel/remove.py +30 -0
- nat/cli/commands/configure/channel/update.py +30 -0
- nat/cli/commands/configure/configure.py +33 -0
- nat/cli/commands/evaluate.py +139 -0
- nat/cli/commands/info/__init__.py +14 -0
- nat/cli/commands/info/info.py +47 -0
- nat/cli/commands/info/list_channels.py +32 -0
- nat/cli/commands/info/list_components.py +128 -0
- nat/cli/commands/mcp/__init__.py +14 -0
- nat/cli/commands/mcp/mcp.py +986 -0
- nat/cli/commands/object_store/__init__.py +14 -0
- nat/cli/commands/object_store/object_store.py +227 -0
- nat/cli/commands/optimize.py +90 -0
- nat/cli/commands/registry/__init__.py +14 -0
- nat/cli/commands/registry/publish.py +88 -0
- nat/cli/commands/registry/pull.py +118 -0
- nat/cli/commands/registry/registry.py +36 -0
- nat/cli/commands/registry/remove.py +108 -0
- nat/cli/commands/registry/search.py +153 -0
- nat/cli/commands/sizing/__init__.py +14 -0
- nat/cli/commands/sizing/calc.py +297 -0
- nat/cli/commands/sizing/sizing.py +27 -0
- nat/cli/commands/start.py +257 -0
- nat/cli/commands/uninstall.py +81 -0
- nat/cli/commands/validate.py +47 -0
- nat/cli/commands/workflow/__init__.py +14 -0
- nat/cli/commands/workflow/templates/__init__.py.j2 +0 -0
- nat/cli/commands/workflow/templates/config.yml.j2 +17 -0
- nat/cli/commands/workflow/templates/pyproject.toml.j2 +25 -0
- nat/cli/commands/workflow/templates/register.py.j2 +4 -0
- nat/cli/commands/workflow/templates/workflow.py.j2 +50 -0
- nat/cli/commands/workflow/workflow.py +37 -0
- nat/cli/commands/workflow/workflow_commands.py +403 -0
- nat/cli/entrypoint.py +141 -0
- nat/cli/main.py +60 -0
- nat/cli/register_workflow.py +522 -0
- nat/cli/type_registry.py +1069 -0
- nat/control_flow/__init__.py +0 -0
- nat/control_flow/register.py +20 -0
- nat/control_flow/router_agent/__init__.py +0 -0
- nat/control_flow/router_agent/agent.py +329 -0
- nat/control_flow/router_agent/prompt.py +48 -0
- nat/control_flow/router_agent/register.py +91 -0
- nat/control_flow/sequential_executor.py +166 -0
- nat/data_models/__init__.py +14 -0
- nat/data_models/agent.py +34 -0
- nat/data_models/api_server.py +843 -0
- nat/data_models/authentication.py +245 -0
- nat/data_models/common.py +171 -0
- nat/data_models/component.py +60 -0
- nat/data_models/component_ref.py +179 -0
- nat/data_models/config.py +434 -0
- nat/data_models/dataset_handler.py +169 -0
- nat/data_models/discovery_metadata.py +305 -0
- nat/data_models/embedder.py +27 -0
- nat/data_models/evaluate.py +130 -0
- nat/data_models/evaluator.py +26 -0
- nat/data_models/front_end.py +26 -0
- nat/data_models/function.py +64 -0
- nat/data_models/function_dependencies.py +80 -0
- nat/data_models/gated_field_mixin.py +242 -0
- nat/data_models/interactive.py +246 -0
- nat/data_models/intermediate_step.py +302 -0
- nat/data_models/invocation_node.py +38 -0
- nat/data_models/llm.py +27 -0
- nat/data_models/logging.py +26 -0
- nat/data_models/memory.py +27 -0
- nat/data_models/object_store.py +44 -0
- nat/data_models/optimizable.py +119 -0
- nat/data_models/optimizer.py +149 -0
- nat/data_models/profiler.py +54 -0
- nat/data_models/registry_handler.py +26 -0
- nat/data_models/retriever.py +30 -0
- nat/data_models/retry_mixin.py +35 -0
- nat/data_models/span.py +228 -0
- nat/data_models/step_adaptor.py +64 -0
- nat/data_models/streaming.py +33 -0
- nat/data_models/swe_bench_model.py +54 -0
- nat/data_models/telemetry_exporter.py +26 -0
- nat/data_models/temperature_mixin.py +44 -0
- nat/data_models/thinking_mixin.py +86 -0
- nat/data_models/top_p_mixin.py +44 -0
- nat/data_models/ttc_strategy.py +30 -0
- nat/embedder/__init__.py +0 -0
- nat/embedder/azure_openai_embedder.py +46 -0
- nat/embedder/nim_embedder.py +59 -0
- nat/embedder/openai_embedder.py +42 -0
- nat/embedder/register.py +22 -0
- nat/eval/__init__.py +14 -0
- nat/eval/config.py +62 -0
- nat/eval/dataset_handler/__init__.py +0 -0
- nat/eval/dataset_handler/dataset_downloader.py +106 -0
- nat/eval/dataset_handler/dataset_filter.py +52 -0
- nat/eval/dataset_handler/dataset_handler.py +431 -0
- nat/eval/evaluate.py +565 -0
- nat/eval/evaluator/__init__.py +14 -0
- nat/eval/evaluator/base_evaluator.py +77 -0
- nat/eval/evaluator/evaluator_model.py +58 -0
- nat/eval/intermediate_step_adapter.py +99 -0
- nat/eval/rag_evaluator/__init__.py +0 -0
- nat/eval/rag_evaluator/evaluate.py +178 -0
- nat/eval/rag_evaluator/register.py +143 -0
- nat/eval/register.py +26 -0
- nat/eval/remote_workflow.py +133 -0
- nat/eval/runners/__init__.py +14 -0
- nat/eval/runners/config.py +39 -0
- nat/eval/runners/multi_eval_runner.py +54 -0
- nat/eval/runtime_evaluator/__init__.py +14 -0
- nat/eval/runtime_evaluator/evaluate.py +123 -0
- nat/eval/runtime_evaluator/register.py +100 -0
- nat/eval/runtime_event_subscriber.py +52 -0
- nat/eval/swe_bench_evaluator/__init__.py +0 -0
- nat/eval/swe_bench_evaluator/evaluate.py +215 -0
- nat/eval/swe_bench_evaluator/register.py +36 -0
- nat/eval/trajectory_evaluator/__init__.py +0 -0
- nat/eval/trajectory_evaluator/evaluate.py +75 -0
- nat/eval/trajectory_evaluator/register.py +40 -0
- nat/eval/tunable_rag_evaluator/__init__.py +0 -0
- nat/eval/tunable_rag_evaluator/evaluate.py +242 -0
- nat/eval/tunable_rag_evaluator/register.py +52 -0
- nat/eval/usage_stats.py +41 -0
- nat/eval/utils/__init__.py +0 -0
- nat/eval/utils/eval_trace_ctx.py +89 -0
- nat/eval/utils/output_uploader.py +140 -0
- nat/eval/utils/tqdm_position_registry.py +40 -0
- nat/eval/utils/weave_eval.py +193 -0
- nat/experimental/__init__.py +0 -0
- nat/experimental/decorators/__init__.py +0 -0
- nat/experimental/decorators/experimental_warning_decorator.py +154 -0
- nat/experimental/test_time_compute/__init__.py +0 -0
- nat/experimental/test_time_compute/editing/__init__.py +0 -0
- nat/experimental/test_time_compute/editing/iterative_plan_refinement_editor.py +147 -0
- nat/experimental/test_time_compute/editing/llm_as_a_judge_editor.py +204 -0
- nat/experimental/test_time_compute/editing/motivation_aware_summarization.py +107 -0
- nat/experimental/test_time_compute/functions/__init__.py +0 -0
- nat/experimental/test_time_compute/functions/execute_score_select_function.py +105 -0
- nat/experimental/test_time_compute/functions/plan_select_execute_function.py +228 -0
- nat/experimental/test_time_compute/functions/ttc_tool_orchestration_function.py +205 -0
- nat/experimental/test_time_compute/functions/ttc_tool_wrapper_function.py +146 -0
- nat/experimental/test_time_compute/models/__init__.py +0 -0
- nat/experimental/test_time_compute/models/editor_config.py +132 -0
- nat/experimental/test_time_compute/models/scoring_config.py +112 -0
- nat/experimental/test_time_compute/models/search_config.py +120 -0
- nat/experimental/test_time_compute/models/selection_config.py +154 -0
- nat/experimental/test_time_compute/models/stage_enums.py +43 -0
- nat/experimental/test_time_compute/models/strategy_base.py +67 -0
- nat/experimental/test_time_compute/models/tool_use_config.py +41 -0
- nat/experimental/test_time_compute/models/ttc_item.py +48 -0
- nat/experimental/test_time_compute/register.py +35 -0
- nat/experimental/test_time_compute/scoring/__init__.py +0 -0
- nat/experimental/test_time_compute/scoring/llm_based_agent_scorer.py +168 -0
- nat/experimental/test_time_compute/scoring/llm_based_plan_scorer.py +168 -0
- nat/experimental/test_time_compute/scoring/motivation_aware_scorer.py +111 -0
- nat/experimental/test_time_compute/search/__init__.py +0 -0
- nat/experimental/test_time_compute/search/multi_llm_planner.py +128 -0
- nat/experimental/test_time_compute/search/multi_query_retrieval_search.py +122 -0
- nat/experimental/test_time_compute/search/single_shot_multi_plan_planner.py +128 -0
- nat/experimental/test_time_compute/selection/__init__.py +0 -0
- nat/experimental/test_time_compute/selection/best_of_n_selector.py +63 -0
- nat/experimental/test_time_compute/selection/llm_based_agent_output_selector.py +131 -0
- nat/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +157 -0
- nat/experimental/test_time_compute/selection/llm_based_plan_selector.py +128 -0
- nat/experimental/test_time_compute/selection/threshold_selector.py +58 -0
- nat/front_ends/__init__.py +14 -0
- nat/front_ends/console/__init__.py +14 -0
- nat/front_ends/console/authentication_flow_handler.py +285 -0
- nat/front_ends/console/console_front_end_config.py +32 -0
- nat/front_ends/console/console_front_end_plugin.py +108 -0
- nat/front_ends/console/register.py +25 -0
- nat/front_ends/cron/__init__.py +14 -0
- nat/front_ends/fastapi/__init__.py +14 -0
- nat/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
- nat/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
- nat/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +142 -0
- nat/front_ends/fastapi/dask_client_mixin.py +65 -0
- nat/front_ends/fastapi/fastapi_front_end_config.py +272 -0
- nat/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
- nat/front_ends/fastapi/fastapi_front_end_plugin.py +247 -0
- nat/front_ends/fastapi/fastapi_front_end_plugin_worker.py +1257 -0
- nat/front_ends/fastapi/html_snippets/__init__.py +14 -0
- nat/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
- nat/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
- nat/front_ends/fastapi/job_store.py +602 -0
- nat/front_ends/fastapi/main.py +64 -0
- nat/front_ends/fastapi/message_handler.py +344 -0
- nat/front_ends/fastapi/message_validator.py +351 -0
- nat/front_ends/fastapi/register.py +25 -0
- nat/front_ends/fastapi/response_helpers.py +195 -0
- nat/front_ends/fastapi/step_adaptor.py +319 -0
- nat/front_ends/fastapi/utils.py +57 -0
- nat/front_ends/mcp/__init__.py +14 -0
- nat/front_ends/mcp/introspection_token_verifier.py +73 -0
- nat/front_ends/mcp/mcp_front_end_config.py +90 -0
- nat/front_ends/mcp/mcp_front_end_plugin.py +113 -0
- nat/front_ends/mcp/mcp_front_end_plugin_worker.py +268 -0
- nat/front_ends/mcp/memory_profiler.py +320 -0
- nat/front_ends/mcp/register.py +27 -0
- nat/front_ends/mcp/tool_converter.py +290 -0
- nat/front_ends/register.py +21 -0
- nat/front_ends/simple_base/__init__.py +14 -0
- nat/front_ends/simple_base/simple_front_end_plugin_base.py +56 -0
- nat/llm/__init__.py +0 -0
- nat/llm/aws_bedrock_llm.py +69 -0
- nat/llm/azure_openai_llm.py +57 -0
- nat/llm/litellm_llm.py +69 -0
- nat/llm/nim_llm.py +58 -0
- nat/llm/openai_llm.py +54 -0
- nat/llm/register.py +27 -0
- nat/llm/utils/__init__.py +14 -0
- nat/llm/utils/env_config_value.py +93 -0
- nat/llm/utils/error.py +17 -0
- nat/llm/utils/thinking.py +215 -0
- nat/memory/__init__.py +20 -0
- nat/memory/interfaces.py +183 -0
- nat/memory/models.py +112 -0
- nat/meta/pypi.md +58 -0
- nat/object_store/__init__.py +20 -0
- nat/object_store/in_memory_object_store.py +76 -0
- nat/object_store/interfaces.py +84 -0
- nat/object_store/models.py +38 -0
- nat/object_store/register.py +19 -0
- nat/observability/__init__.py +14 -0
- nat/observability/exporter/__init__.py +14 -0
- nat/observability/exporter/base_exporter.py +449 -0
- nat/observability/exporter/exporter.py +78 -0
- nat/observability/exporter/file_exporter.py +33 -0
- nat/observability/exporter/processing_exporter.py +550 -0
- nat/observability/exporter/raw_exporter.py +52 -0
- nat/observability/exporter/span_exporter.py +308 -0
- nat/observability/exporter_manager.py +335 -0
- nat/observability/mixin/__init__.py +14 -0
- nat/observability/mixin/batch_config_mixin.py +26 -0
- nat/observability/mixin/collector_config_mixin.py +23 -0
- nat/observability/mixin/file_mixin.py +288 -0
- nat/observability/mixin/file_mode.py +23 -0
- nat/observability/mixin/redaction_config_mixin.py +42 -0
- nat/observability/mixin/resource_conflict_mixin.py +134 -0
- nat/observability/mixin/serialize_mixin.py +61 -0
- nat/observability/mixin/tagging_config_mixin.py +62 -0
- nat/observability/mixin/type_introspection_mixin.py +496 -0
- nat/observability/processor/__init__.py +14 -0
- nat/observability/processor/batching_processor.py +308 -0
- nat/observability/processor/callback_processor.py +42 -0
- nat/observability/processor/falsy_batch_filter_processor.py +55 -0
- nat/observability/processor/intermediate_step_serializer.py +28 -0
- nat/observability/processor/processor.py +74 -0
- nat/observability/processor/processor_factory.py +70 -0
- nat/observability/processor/redaction/__init__.py +24 -0
- nat/observability/processor/redaction/contextual_redaction_processor.py +125 -0
- nat/observability/processor/redaction/contextual_span_redaction_processor.py +66 -0
- nat/observability/processor/redaction/redaction_processor.py +177 -0
- nat/observability/processor/redaction/span_header_redaction_processor.py +92 -0
- nat/observability/processor/span_tagging_processor.py +68 -0
- nat/observability/register.py +114 -0
- nat/observability/utils/__init__.py +14 -0
- nat/observability/utils/dict_utils.py +236 -0
- nat/observability/utils/time_utils.py +31 -0
- nat/plugins/.namespace +1 -0
- nat/profiler/__init__.py +0 -0
- nat/profiler/calc/__init__.py +14 -0
- nat/profiler/calc/calc_runner.py +626 -0
- nat/profiler/calc/calculations.py +288 -0
- nat/profiler/calc/data_models.py +188 -0
- nat/profiler/calc/plot.py +345 -0
- nat/profiler/callbacks/__init__.py +0 -0
- nat/profiler/callbacks/agno_callback_handler.py +295 -0
- nat/profiler/callbacks/base_callback_class.py +20 -0
- nat/profiler/callbacks/langchain_callback_handler.py +297 -0
- nat/profiler/callbacks/llama_index_callback_handler.py +205 -0
- nat/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
- nat/profiler/callbacks/token_usage_base_model.py +27 -0
- nat/profiler/data_frame_row.py +51 -0
- nat/profiler/data_models.py +24 -0
- nat/profiler/decorators/__init__.py +0 -0
- nat/profiler/decorators/framework_wrapper.py +180 -0
- nat/profiler/decorators/function_tracking.py +411 -0
- nat/profiler/forecasting/__init__.py +0 -0
- nat/profiler/forecasting/config.py +18 -0
- nat/profiler/forecasting/model_trainer.py +75 -0
- nat/profiler/forecasting/models/__init__.py +22 -0
- nat/profiler/forecasting/models/forecasting_base_model.py +42 -0
- nat/profiler/forecasting/models/linear_model.py +197 -0
- nat/profiler/forecasting/models/random_forest_regressor.py +269 -0
- nat/profiler/inference_metrics_model.py +28 -0
- nat/profiler/inference_optimization/__init__.py +0 -0
- nat/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
- nat/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +460 -0
- nat/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
- nat/profiler/inference_optimization/data_models.py +386 -0
- nat/profiler/inference_optimization/experimental/__init__.py +0 -0
- nat/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
- nat/profiler/inference_optimization/experimental/prefix_span_analysis.py +404 -0
- nat/profiler/inference_optimization/llm_metrics.py +212 -0
- nat/profiler/inference_optimization/prompt_caching.py +163 -0
- nat/profiler/inference_optimization/token_uniqueness.py +107 -0
- nat/profiler/inference_optimization/workflow_runtimes.py +72 -0
- nat/profiler/intermediate_property_adapter.py +102 -0
- nat/profiler/parameter_optimization/__init__.py +0 -0
- nat/profiler/parameter_optimization/optimizable_utils.py +93 -0
- nat/profiler/parameter_optimization/optimizer_runtime.py +67 -0
- nat/profiler/parameter_optimization/parameter_optimizer.py +153 -0
- nat/profiler/parameter_optimization/parameter_selection.py +107 -0
- nat/profiler/parameter_optimization/pareto_visualizer.py +380 -0
- nat/profiler/parameter_optimization/prompt_optimizer.py +384 -0
- nat/profiler/parameter_optimization/update_helpers.py +66 -0
- nat/profiler/profile_runner.py +478 -0
- nat/profiler/utils.py +186 -0
- nat/registry_handlers/__init__.py +0 -0
- nat/registry_handlers/local/__init__.py +0 -0
- nat/registry_handlers/local/local_handler.py +176 -0
- nat/registry_handlers/local/register_local.py +37 -0
- nat/registry_handlers/metadata_factory.py +60 -0
- nat/registry_handlers/package_utils.py +570 -0
- nat/registry_handlers/pypi/__init__.py +0 -0
- nat/registry_handlers/pypi/pypi_handler.py +248 -0
- nat/registry_handlers/pypi/register_pypi.py +40 -0
- nat/registry_handlers/register.py +20 -0
- nat/registry_handlers/registry_handler_base.py +157 -0
- nat/registry_handlers/rest/__init__.py +0 -0
- nat/registry_handlers/rest/register_rest.py +56 -0
- nat/registry_handlers/rest/rest_handler.py +236 -0
- nat/registry_handlers/schemas/__init__.py +0 -0
- nat/registry_handlers/schemas/headers.py +42 -0
- nat/registry_handlers/schemas/package.py +68 -0
- nat/registry_handlers/schemas/publish.py +68 -0
- nat/registry_handlers/schemas/pull.py +82 -0
- nat/registry_handlers/schemas/remove.py +36 -0
- nat/registry_handlers/schemas/search.py +91 -0
- nat/registry_handlers/schemas/status.py +47 -0
- nat/retriever/__init__.py +0 -0
- nat/retriever/interface.py +41 -0
- nat/retriever/milvus/__init__.py +14 -0
- nat/retriever/milvus/register.py +81 -0
- nat/retriever/milvus/retriever.py +228 -0
- nat/retriever/models.py +77 -0
- nat/retriever/nemo_retriever/__init__.py +14 -0
- nat/retriever/nemo_retriever/register.py +60 -0
- nat/retriever/nemo_retriever/retriever.py +190 -0
- nat/retriever/register.py +21 -0
- nat/runtime/__init__.py +14 -0
- nat/runtime/loader.py +220 -0
- nat/runtime/runner.py +292 -0
- nat/runtime/session.py +223 -0
- nat/runtime/user_metadata.py +130 -0
- nat/settings/__init__.py +0 -0
- nat/settings/global_settings.py +329 -0
- nat/test/.namespace +1 -0
- nat/tool/__init__.py +0 -0
- nat/tool/chat_completion.py +77 -0
- nat/tool/code_execution/README.md +151 -0
- nat/tool/code_execution/__init__.py +0 -0
- nat/tool/code_execution/code_sandbox.py +267 -0
- nat/tool/code_execution/local_sandbox/.gitignore +1 -0
- nat/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
- nat/tool/code_execution/local_sandbox/__init__.py +13 -0
- nat/tool/code_execution/local_sandbox/local_sandbox_server.py +198 -0
- nat/tool/code_execution/local_sandbox/sandbox.requirements.txt +6 -0
- nat/tool/code_execution/local_sandbox/start_local_sandbox.sh +50 -0
- nat/tool/code_execution/register.py +74 -0
- nat/tool/code_execution/test_code_execution_sandbox.py +414 -0
- nat/tool/code_execution/utils.py +100 -0
- nat/tool/datetime_tools.py +82 -0
- nat/tool/document_search.py +141 -0
- nat/tool/github_tools.py +450 -0
- nat/tool/memory_tools/__init__.py +0 -0
- nat/tool/memory_tools/add_memory_tool.py +79 -0
- nat/tool/memory_tools/delete_memory_tool.py +66 -0
- nat/tool/memory_tools/get_memory_tool.py +72 -0
- nat/tool/nvidia_rag.py +95 -0
- nat/tool/register.py +31 -0
- nat/tool/retriever.py +95 -0
- nat/tool/server_tools.py +66 -0
- nat/utils/__init__.py +0 -0
- nat/utils/callable_utils.py +70 -0
- nat/utils/data_models/__init__.py +0 -0
- nat/utils/data_models/schema_validator.py +58 -0
- nat/utils/debugging_utils.py +43 -0
- nat/utils/decorators.py +210 -0
- nat/utils/dump_distro_mapping.py +32 -0
- nat/utils/exception_handlers/__init__.py +0 -0
- nat/utils/exception_handlers/automatic_retries.py +342 -0
- nat/utils/exception_handlers/schemas.py +114 -0
- nat/utils/io/__init__.py +0 -0
- nat/utils/io/model_processing.py +28 -0
- nat/utils/io/yaml_tools.py +119 -0
- nat/utils/log_levels.py +25 -0
- nat/utils/log_utils.py +37 -0
- nat/utils/metadata_utils.py +74 -0
- nat/utils/optional_imports.py +142 -0
- nat/utils/producer_consumer_queue.py +178 -0
- nat/utils/reactive/__init__.py +0 -0
- nat/utils/reactive/base/__init__.py +0 -0
- nat/utils/reactive/base/observable_base.py +65 -0
- nat/utils/reactive/base/observer_base.py +55 -0
- nat/utils/reactive/base/subject_base.py +79 -0
- nat/utils/reactive/observable.py +59 -0
- nat/utils/reactive/observer.py +76 -0
- nat/utils/reactive/subject.py +131 -0
- nat/utils/reactive/subscription.py +49 -0
- nat/utils/settings/__init__.py +0 -0
- nat/utils/settings/global_settings.py +195 -0
- nat/utils/string_utils.py +38 -0
- nat/utils/type_converter.py +299 -0
- nat/utils/type_utils.py +488 -0
- nat/utils/url_utils.py +27 -0
- nvidia_nat-1.1.0a20251020.dist-info/METADATA +195 -0
- nvidia_nat-1.1.0a20251020.dist-info/RECORD +480 -0
- nvidia_nat-1.1.0a20251020.dist-info/WHEEL +5 -0
- nvidia_nat-1.1.0a20251020.dist-info/entry_points.txt +22 -0
- nvidia_nat-1.1.0a20251020.dist-info/licenses/LICENSE-3rd-party.txt +5478 -0
- nvidia_nat-1.1.0a20251020.dist-info/licenses/LICENSE.md +201 -0
- nvidia_nat-1.1.0a20251020.dist-info/top_level.txt +2 -0
|
@@ -0,0 +1,268 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
from abc import ABC
|
|
18
|
+
from abc import abstractmethod
|
|
19
|
+
from collections.abc import Mapping
|
|
20
|
+
from typing import Any
|
|
21
|
+
|
|
22
|
+
from mcp.server.fastmcp import FastMCP
|
|
23
|
+
from starlette.exceptions import HTTPException
|
|
24
|
+
from starlette.requests import Request
|
|
25
|
+
|
|
26
|
+
from nat.builder.function import Function
|
|
27
|
+
from nat.builder.function_base import FunctionBase
|
|
28
|
+
from nat.builder.workflow import Workflow
|
|
29
|
+
from nat.builder.workflow_builder import WorkflowBuilder
|
|
30
|
+
from nat.data_models.config import Config
|
|
31
|
+
from nat.front_ends.mcp.mcp_front_end_config import MCPFrontEndConfig
|
|
32
|
+
from nat.front_ends.mcp.memory_profiler import MemoryProfiler
|
|
33
|
+
|
|
34
|
+
logger = logging.getLogger(__name__)
|
|
35
|
+
|
|
36
|
+
|
|
37
|
+
class MCPFrontEndPluginWorkerBase(ABC):
|
|
38
|
+
"""Base class for MCP front end plugin workers."""
|
|
39
|
+
|
|
40
|
+
def __init__(self, config: Config):
|
|
41
|
+
"""Initialize the MCP worker with configuration.
|
|
42
|
+
|
|
43
|
+
Args:
|
|
44
|
+
config: The full NAT configuration
|
|
45
|
+
"""
|
|
46
|
+
self.full_config = config
|
|
47
|
+
self.front_end_config: MCPFrontEndConfig = config.general.front_end
|
|
48
|
+
|
|
49
|
+
# Initialize memory profiler if enabled
|
|
50
|
+
self.memory_profiler = MemoryProfiler(enabled=self.front_end_config.enable_memory_profiling,
|
|
51
|
+
log_interval=self.front_end_config.memory_profile_interval,
|
|
52
|
+
top_n=self.front_end_config.memory_profile_top_n,
|
|
53
|
+
log_level=self.front_end_config.memory_profile_log_level)
|
|
54
|
+
|
|
55
|
+
def _setup_health_endpoint(self, mcp: FastMCP):
|
|
56
|
+
"""Set up the HTTP health endpoint that exercises MCP ping handler."""
|
|
57
|
+
|
|
58
|
+
@mcp.custom_route("/health", methods=["GET"])
|
|
59
|
+
async def health_check(_request: Request):
|
|
60
|
+
"""HTTP health check using server's internal ping handler"""
|
|
61
|
+
from starlette.responses import JSONResponse
|
|
62
|
+
|
|
63
|
+
try:
|
|
64
|
+
from mcp.types import PingRequest
|
|
65
|
+
|
|
66
|
+
# Create a ping request
|
|
67
|
+
ping_request = PingRequest(method="ping")
|
|
68
|
+
|
|
69
|
+
# Call the ping handler directly (same one that responds to MCP pings)
|
|
70
|
+
await mcp._mcp_server.request_handlers[PingRequest](ping_request)
|
|
71
|
+
|
|
72
|
+
return JSONResponse({
|
|
73
|
+
"status": "healthy",
|
|
74
|
+
"error": None,
|
|
75
|
+
"server_name": mcp.name,
|
|
76
|
+
})
|
|
77
|
+
|
|
78
|
+
except Exception as e:
|
|
79
|
+
return JSONResponse({
|
|
80
|
+
"status": "unhealthy",
|
|
81
|
+
"error": str(e),
|
|
82
|
+
"server_name": mcp.name,
|
|
83
|
+
},
|
|
84
|
+
status_code=503)
|
|
85
|
+
|
|
86
|
+
@abstractmethod
|
|
87
|
+
async def add_routes(self, mcp: FastMCP, builder: WorkflowBuilder):
|
|
88
|
+
"""Add routes to the MCP server.
|
|
89
|
+
|
|
90
|
+
Args:
|
|
91
|
+
mcp: The FastMCP server instance
|
|
92
|
+
builder (WorkflowBuilder): The workflow builder instance
|
|
93
|
+
"""
|
|
94
|
+
pass
|
|
95
|
+
|
|
96
|
+
async def _get_all_functions(self, workflow: Workflow) -> dict[str, Function]:
|
|
97
|
+
"""Get all functions from the workflow.
|
|
98
|
+
|
|
99
|
+
Args:
|
|
100
|
+
workflow: The NAT workflow.
|
|
101
|
+
|
|
102
|
+
Returns:
|
|
103
|
+
Dict mapping function names to Function objects.
|
|
104
|
+
"""
|
|
105
|
+
functions: dict[str, Function] = {}
|
|
106
|
+
|
|
107
|
+
# Extract all functions from the workflow
|
|
108
|
+
functions.update(workflow.functions)
|
|
109
|
+
for function_group in workflow.function_groups.values():
|
|
110
|
+
functions.update(await function_group.get_accessible_functions())
|
|
111
|
+
|
|
112
|
+
if workflow.config.workflow.workflow_alias:
|
|
113
|
+
functions[workflow.config.workflow.workflow_alias] = workflow
|
|
114
|
+
else:
|
|
115
|
+
functions[workflow.config.workflow.type] = workflow
|
|
116
|
+
|
|
117
|
+
return functions
|
|
118
|
+
|
|
119
|
+
def _setup_debug_endpoints(self, mcp: FastMCP, functions: Mapping[str, FunctionBase]) -> None:
|
|
120
|
+
"""Set up HTTP debug endpoints for introspecting tools and schemas.
|
|
121
|
+
|
|
122
|
+
Exposes:
|
|
123
|
+
- GET /debug/tools/list: List tools. Optional query param `name` (one or more, repeatable or comma separated)
|
|
124
|
+
selects a subset and returns details for those tools.
|
|
125
|
+
- GET /debug/memory/stats: Get current memory profiling statistics (read-only)
|
|
126
|
+
"""
|
|
127
|
+
|
|
128
|
+
@mcp.custom_route("/debug/tools/list", methods=["GET"])
|
|
129
|
+
async def list_tools(request: Request):
|
|
130
|
+
"""HTTP list tools endpoint."""
|
|
131
|
+
|
|
132
|
+
from starlette.responses import JSONResponse
|
|
133
|
+
|
|
134
|
+
from nat.front_ends.mcp.tool_converter import get_function_description
|
|
135
|
+
|
|
136
|
+
# Query params
|
|
137
|
+
# Support repeated names and comma-separated lists
|
|
138
|
+
names_param_list = set(request.query_params.getlist("name"))
|
|
139
|
+
names: list[str] = []
|
|
140
|
+
for raw in names_param_list:
|
|
141
|
+
# if p.strip() is empty, it won't be included in the list!
|
|
142
|
+
parts = [p.strip() for p in raw.split(",") if p.strip()]
|
|
143
|
+
names.extend(parts)
|
|
144
|
+
detail_raw = request.query_params.get("detail")
|
|
145
|
+
|
|
146
|
+
def _parse_detail_param(detail_param: str | None, has_names: bool) -> bool:
|
|
147
|
+
if detail_param is None:
|
|
148
|
+
if has_names:
|
|
149
|
+
return True
|
|
150
|
+
return False
|
|
151
|
+
v = detail_param.strip().lower()
|
|
152
|
+
if v in ("0", "false", "no", "off"):
|
|
153
|
+
return False
|
|
154
|
+
if v in ("1", "true", "yes", "on"):
|
|
155
|
+
return True
|
|
156
|
+
# For invalid values, default based on whether names are present
|
|
157
|
+
return has_names
|
|
158
|
+
|
|
159
|
+
# Helper function to build the input schema info
|
|
160
|
+
def _build_schema_info(fn: FunctionBase) -> dict[str, Any] | None:
|
|
161
|
+
schema = getattr(fn, "input_schema", None)
|
|
162
|
+
if schema is None:
|
|
163
|
+
return None
|
|
164
|
+
|
|
165
|
+
# check if schema is a ChatRequest
|
|
166
|
+
schema_name = getattr(schema, "__name__", "")
|
|
167
|
+
schema_qualname = getattr(schema, "__qualname__", "")
|
|
168
|
+
if "ChatRequest" in schema_name or "ChatRequest" in schema_qualname:
|
|
169
|
+
# Simplified interface used by MCP wrapper for ChatRequest
|
|
170
|
+
return {
|
|
171
|
+
"type": "object",
|
|
172
|
+
"properties": {
|
|
173
|
+
"query": {
|
|
174
|
+
"type": "string", "description": "User query string"
|
|
175
|
+
}
|
|
176
|
+
},
|
|
177
|
+
"required": ["query"],
|
|
178
|
+
"title": "ChatRequestQuery",
|
|
179
|
+
}
|
|
180
|
+
|
|
181
|
+
# Pydantic models provide model_json_schema
|
|
182
|
+
if schema is not None and hasattr(schema, "model_json_schema"):
|
|
183
|
+
return schema.model_json_schema()
|
|
184
|
+
|
|
185
|
+
return None
|
|
186
|
+
|
|
187
|
+
def _build_final_json(functions_to_include: Mapping[str, FunctionBase],
|
|
188
|
+
include_schemas: bool = False) -> dict[str, Any]:
|
|
189
|
+
tools = []
|
|
190
|
+
for name, fn in functions_to_include.items():
|
|
191
|
+
list_entry: dict[str, Any] = {
|
|
192
|
+
"name": name, "description": get_function_description(fn), "is_workflow": hasattr(fn, "run")
|
|
193
|
+
}
|
|
194
|
+
if include_schemas:
|
|
195
|
+
list_entry["schema"] = _build_schema_info(fn)
|
|
196
|
+
tools.append(list_entry)
|
|
197
|
+
|
|
198
|
+
return {
|
|
199
|
+
"count": len(tools),
|
|
200
|
+
"tools": tools,
|
|
201
|
+
"server_name": mcp.name,
|
|
202
|
+
}
|
|
203
|
+
|
|
204
|
+
if names:
|
|
205
|
+
# Return selected tools
|
|
206
|
+
try:
|
|
207
|
+
functions_to_include = {n: functions[n] for n in names}
|
|
208
|
+
except KeyError as e:
|
|
209
|
+
raise HTTPException(status_code=404, detail=f"Tool \"{e.args[0]}\" not found.") from e
|
|
210
|
+
else:
|
|
211
|
+
functions_to_include = functions
|
|
212
|
+
|
|
213
|
+
# Default for listing all: detail defaults to False unless explicitly set true
|
|
214
|
+
return JSONResponse(
|
|
215
|
+
_build_final_json(functions_to_include, _parse_detail_param(detail_raw, has_names=bool(names))))
|
|
216
|
+
|
|
217
|
+
# Memory profiling endpoint (read-only)
|
|
218
|
+
@mcp.custom_route("/debug/memory/stats", methods=["GET"])
|
|
219
|
+
async def get_memory_stats(_request: Request):
|
|
220
|
+
"""Get current memory profiling statistics."""
|
|
221
|
+
from starlette.responses import JSONResponse
|
|
222
|
+
|
|
223
|
+
stats = self.memory_profiler.get_stats()
|
|
224
|
+
return JSONResponse(stats)
|
|
225
|
+
|
|
226
|
+
|
|
227
|
+
class MCPFrontEndPluginWorker(MCPFrontEndPluginWorkerBase):
|
|
228
|
+
"""Default MCP front end plugin worker implementation."""
|
|
229
|
+
|
|
230
|
+
async def add_routes(self, mcp: FastMCP, builder: WorkflowBuilder):
|
|
231
|
+
"""Add default routes to the MCP server.
|
|
232
|
+
|
|
233
|
+
Args:
|
|
234
|
+
mcp: The FastMCP server instance
|
|
235
|
+
builder (WorkflowBuilder): The workflow builder instance
|
|
236
|
+
"""
|
|
237
|
+
from nat.front_ends.mcp.tool_converter import register_function_with_mcp
|
|
238
|
+
|
|
239
|
+
# Set up the health endpoint
|
|
240
|
+
self._setup_health_endpoint(mcp)
|
|
241
|
+
|
|
242
|
+
# Build the workflow and register all functions with MCP
|
|
243
|
+
workflow = await builder.build()
|
|
244
|
+
|
|
245
|
+
# Get all functions from the workflow
|
|
246
|
+
functions = await self._get_all_functions(workflow)
|
|
247
|
+
|
|
248
|
+
# Filter functions based on tool_names if provided
|
|
249
|
+
if self.front_end_config.tool_names:
|
|
250
|
+
logger.info("Filtering functions based on tool_names: %s", self.front_end_config.tool_names)
|
|
251
|
+
filtered_functions: dict[str, Function] = {}
|
|
252
|
+
for function_name, function in functions.items():
|
|
253
|
+
if function_name in self.front_end_config.tool_names:
|
|
254
|
+
filtered_functions[function_name] = function
|
|
255
|
+
else:
|
|
256
|
+
logger.debug("Skipping function %s as it's not in tool_names", function_name)
|
|
257
|
+
functions = filtered_functions
|
|
258
|
+
|
|
259
|
+
# Register each function with MCP, passing workflow context for observability
|
|
260
|
+
for function_name, function in functions.items():
|
|
261
|
+
register_function_with_mcp(mcp, function_name, function, workflow, self.memory_profiler)
|
|
262
|
+
|
|
263
|
+
# Add a simple fallback function if no functions were found
|
|
264
|
+
if not functions:
|
|
265
|
+
raise RuntimeError("No functions found in workflow. Please check your configuration.")
|
|
266
|
+
|
|
267
|
+
# After registration, expose debug endpoints for tool/schema inspection
|
|
268
|
+
self._setup_debug_endpoints(mcp, functions)
|
|
@@ -0,0 +1,320 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
"""Memory profiling utilities for MCP frontend."""
|
|
16
|
+
|
|
17
|
+
import gc
|
|
18
|
+
import logging
|
|
19
|
+
import tracemalloc
|
|
20
|
+
from typing import Any
|
|
21
|
+
|
|
22
|
+
logger = logging.getLogger(__name__)
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
class MemoryProfiler:
|
|
26
|
+
"""Memory profiler for tracking memory usage and potential leaks."""
|
|
27
|
+
|
|
28
|
+
def __init__(self, enabled: bool = False, log_interval: int = 50, top_n: int = 10, log_level: str = "DEBUG"):
|
|
29
|
+
"""Initialize the memory profiler.
|
|
30
|
+
|
|
31
|
+
Args:
|
|
32
|
+
enabled: Whether memory profiling is enabled
|
|
33
|
+
log_interval: Log stats every N requests
|
|
34
|
+
top_n: Number of top allocations to log
|
|
35
|
+
log_level: Log level for memory profiling output (e.g., "DEBUG", "INFO")
|
|
36
|
+
"""
|
|
37
|
+
self.enabled = enabled
|
|
38
|
+
# normalize interval to avoid modulo-by-zero
|
|
39
|
+
self.log_interval = max(1, int(log_interval))
|
|
40
|
+
self.top_n = top_n
|
|
41
|
+
self.log_level = getattr(logging, log_level.upper(), logging.DEBUG)
|
|
42
|
+
self.request_count = 0
|
|
43
|
+
self.baseline_snapshot = None
|
|
44
|
+
|
|
45
|
+
# Track whether this instance started tracemalloc (to avoid resetting external tracing)
|
|
46
|
+
self._we_started_tracemalloc = False
|
|
47
|
+
|
|
48
|
+
if self.enabled:
|
|
49
|
+
logger.info("Memory profiling ENABLED (interval=%d, top_n=%d, log_level=%s)",
|
|
50
|
+
self.log_interval,
|
|
51
|
+
top_n,
|
|
52
|
+
log_level)
|
|
53
|
+
try:
|
|
54
|
+
if not tracemalloc.is_tracing():
|
|
55
|
+
tracemalloc.start()
|
|
56
|
+
self._we_started_tracemalloc = True
|
|
57
|
+
# Take baseline snapshot
|
|
58
|
+
gc.collect()
|
|
59
|
+
self.baseline_snapshot = tracemalloc.take_snapshot()
|
|
60
|
+
except RuntimeError as e:
|
|
61
|
+
logger.warning("tracemalloc unavailable or not tracing: %s", e)
|
|
62
|
+
else:
|
|
63
|
+
logger.info("Memory profiling DISABLED")
|
|
64
|
+
|
|
65
|
+
def _log(self, message: str, *args: Any) -> None:
|
|
66
|
+
"""Log a message at the configured log level.
|
|
67
|
+
|
|
68
|
+
Args:
|
|
69
|
+
message: Log message format string
|
|
70
|
+
args: Arguments for the format string
|
|
71
|
+
"""
|
|
72
|
+
logger.log(self.log_level, message, *args)
|
|
73
|
+
|
|
74
|
+
def on_request_complete(self) -> None:
|
|
75
|
+
"""Called after each request completes."""
|
|
76
|
+
if not self.enabled:
|
|
77
|
+
return
|
|
78
|
+
self.request_count += 1
|
|
79
|
+
if self.request_count % self.log_interval == 0:
|
|
80
|
+
self.log_memory_stats()
|
|
81
|
+
|
|
82
|
+
def _ensure_tracing(self) -> bool:
|
|
83
|
+
"""Ensure tracemalloc is running if we started it originally.
|
|
84
|
+
|
|
85
|
+
Returns:
|
|
86
|
+
True if tracemalloc is active, False otherwise
|
|
87
|
+
"""
|
|
88
|
+
if tracemalloc.is_tracing():
|
|
89
|
+
return True
|
|
90
|
+
|
|
91
|
+
# Only restart if we started it originally (respect external control)
|
|
92
|
+
if not self._we_started_tracemalloc:
|
|
93
|
+
return False
|
|
94
|
+
|
|
95
|
+
# Attempt to restart
|
|
96
|
+
try:
|
|
97
|
+
logger.warning("tracemalloc was stopped externally; restarting (we started it originally)")
|
|
98
|
+
tracemalloc.start()
|
|
99
|
+
|
|
100
|
+
# Reset baseline since old tracking data is lost
|
|
101
|
+
gc.collect()
|
|
102
|
+
self.baseline_snapshot = tracemalloc.take_snapshot()
|
|
103
|
+
logger.info("Baseline snapshot reset after tracemalloc restart")
|
|
104
|
+
|
|
105
|
+
return True
|
|
106
|
+
except RuntimeError as e:
|
|
107
|
+
logger.error("Failed to restart tracemalloc: %s", e)
|
|
108
|
+
return False
|
|
109
|
+
|
|
110
|
+
def _safe_traced_memory(self) -> tuple[float, float] | None:
|
|
111
|
+
"""Return (current, peak usage in MB) if tracemalloc is active, else None."""
|
|
112
|
+
if not self._ensure_tracing():
|
|
113
|
+
return None
|
|
114
|
+
|
|
115
|
+
try:
|
|
116
|
+
current, peak = tracemalloc.get_traced_memory()
|
|
117
|
+
megabyte = (1 << 20)
|
|
118
|
+
return (current / megabyte, peak / megabyte)
|
|
119
|
+
except RuntimeError:
|
|
120
|
+
return None
|
|
121
|
+
|
|
122
|
+
def _safe_snapshot(self) -> tracemalloc.Snapshot | None:
|
|
123
|
+
"""Return a tracemalloc Snapshot if available, else None."""
|
|
124
|
+
if not self._ensure_tracing():
|
|
125
|
+
return None
|
|
126
|
+
|
|
127
|
+
try:
|
|
128
|
+
return tracemalloc.take_snapshot()
|
|
129
|
+
except RuntimeError:
|
|
130
|
+
return None
|
|
131
|
+
|
|
132
|
+
def log_memory_stats(self) -> dict[str, Any]:
|
|
133
|
+
"""Log current memory statistics and return them."""
|
|
134
|
+
if not self.enabled:
|
|
135
|
+
return {}
|
|
136
|
+
|
|
137
|
+
# Force garbage collection first
|
|
138
|
+
gc.collect()
|
|
139
|
+
|
|
140
|
+
# Get current memory usage
|
|
141
|
+
mem = self._safe_traced_memory()
|
|
142
|
+
if mem is None:
|
|
143
|
+
logger.info("tracemalloc is not active; cannot collect memory stats.")
|
|
144
|
+
# still return structural fields
|
|
145
|
+
stats = {
|
|
146
|
+
"request_count": self.request_count,
|
|
147
|
+
"current_memory_mb": None,
|
|
148
|
+
"peak_memory_mb": None,
|
|
149
|
+
"active_intermediate_managers": self._safe_intermediate_step_manager_count(),
|
|
150
|
+
"outstanding_steps": self._safe_outstanding_step_count(),
|
|
151
|
+
"active_exporters": self._safe_exporter_count(),
|
|
152
|
+
"isolated_exporters": self._safe_isolated_exporter_count(),
|
|
153
|
+
"subject_instances": self._count_instances_of_type("Subject"),
|
|
154
|
+
}
|
|
155
|
+
return stats
|
|
156
|
+
|
|
157
|
+
current_mb, peak_mb = mem
|
|
158
|
+
|
|
159
|
+
# Take snapshot and compare to baseline
|
|
160
|
+
snapshot = self._safe_snapshot()
|
|
161
|
+
|
|
162
|
+
# Track BaseExporter instances (observability layer)
|
|
163
|
+
exporter_count = self._safe_exporter_count()
|
|
164
|
+
isolated_exporter_count = self._safe_isolated_exporter_count()
|
|
165
|
+
|
|
166
|
+
# Track Subject instances (event streams)
|
|
167
|
+
subject_count = self._count_instances_of_type("Subject")
|
|
168
|
+
|
|
169
|
+
stats = {
|
|
170
|
+
"request_count": self.request_count,
|
|
171
|
+
"current_memory_mb": round(current_mb, 2),
|
|
172
|
+
"peak_memory_mb": round(peak_mb, 2),
|
|
173
|
+
"active_intermediate_managers": self._safe_intermediate_step_manager_count(),
|
|
174
|
+
"outstanding_steps": self._safe_outstanding_step_count(),
|
|
175
|
+
"active_exporters": exporter_count,
|
|
176
|
+
"isolated_exporters": isolated_exporter_count,
|
|
177
|
+
"subject_instances": subject_count,
|
|
178
|
+
}
|
|
179
|
+
|
|
180
|
+
self._log("=" * 80)
|
|
181
|
+
self._log("MEMORY PROFILE AFTER %d REQUESTS:", self.request_count)
|
|
182
|
+
self._log(" Current Memory: %.2f MB", current_mb)
|
|
183
|
+
self._log(" Peak Memory: %.2f MB", peak_mb)
|
|
184
|
+
self._log("")
|
|
185
|
+
self._log("NAT COMPONENT INSTANCES:")
|
|
186
|
+
self._log(" IntermediateStepManagers: %d active (%d outstanding steps)",
|
|
187
|
+
stats["active_intermediate_managers"],
|
|
188
|
+
stats["outstanding_steps"])
|
|
189
|
+
self._log(" BaseExporters: %d active (%d isolated)", stats["active_exporters"], stats["isolated_exporters"])
|
|
190
|
+
self._log(" Subject (event streams): %d instances", stats["subject_instances"])
|
|
191
|
+
|
|
192
|
+
# Show top allocations
|
|
193
|
+
if snapshot is None:
|
|
194
|
+
self._log("tracemalloc snapshot unavailable.")
|
|
195
|
+
else:
|
|
196
|
+
if self.baseline_snapshot:
|
|
197
|
+
self._log("TOP %d MEMORY GROWTH SINCE BASELINE:", self.top_n)
|
|
198
|
+
top_stats = snapshot.compare_to(self.baseline_snapshot, 'lineno')
|
|
199
|
+
else:
|
|
200
|
+
self._log("TOP %d MEMORY ALLOCATIONS:", self.top_n)
|
|
201
|
+
top_stats = snapshot.statistics('lineno')
|
|
202
|
+
|
|
203
|
+
for i, stat in enumerate(top_stats[:self.top_n], 1):
|
|
204
|
+
self._log(" #%d: %s", i, stat)
|
|
205
|
+
|
|
206
|
+
self._log("=" * 80)
|
|
207
|
+
|
|
208
|
+
return stats
|
|
209
|
+
|
|
210
|
+
def _count_instances_of_type(self, type_name: str) -> int:
|
|
211
|
+
"""Count instances of a specific type in memory."""
|
|
212
|
+
count = 0
|
|
213
|
+
for obj in gc.get_objects():
|
|
214
|
+
try:
|
|
215
|
+
if type(obj).__name__ == type_name:
|
|
216
|
+
count += 1
|
|
217
|
+
except Exception:
|
|
218
|
+
pass
|
|
219
|
+
return count
|
|
220
|
+
|
|
221
|
+
def _safe_exporter_count(self) -> int:
|
|
222
|
+
try:
|
|
223
|
+
from nat.observability.exporter.base_exporter import BaseExporter
|
|
224
|
+
return BaseExporter.get_active_instance_count()
|
|
225
|
+
except Exception as e:
|
|
226
|
+
logger.debug("Could not get BaseExporter stats: %s", e)
|
|
227
|
+
return 0
|
|
228
|
+
|
|
229
|
+
def _safe_isolated_exporter_count(self) -> int:
|
|
230
|
+
try:
|
|
231
|
+
from nat.observability.exporter.base_exporter import BaseExporter
|
|
232
|
+
return BaseExporter.get_isolated_instance_count()
|
|
233
|
+
except Exception:
|
|
234
|
+
return 0
|
|
235
|
+
|
|
236
|
+
def _safe_intermediate_step_manager_count(self) -> int:
|
|
237
|
+
try:
|
|
238
|
+
from nat.builder.intermediate_step_manager import IntermediateStepManager
|
|
239
|
+
# len() is atomic in CPython, but catch RuntimeError just in case
|
|
240
|
+
try:
|
|
241
|
+
return IntermediateStepManager.get_active_instance_count()
|
|
242
|
+
except RuntimeError:
|
|
243
|
+
# Set was modified during len() - very rare
|
|
244
|
+
logger.debug("Set changed during count, returning 0")
|
|
245
|
+
return 0
|
|
246
|
+
except Exception as e:
|
|
247
|
+
logger.debug("Could not get IntermediateStepManager stats: %s", e)
|
|
248
|
+
return 0
|
|
249
|
+
|
|
250
|
+
def _safe_outstanding_step_count(self) -> int:
|
|
251
|
+
"""Get total outstanding steps across all active IntermediateStepManager instances."""
|
|
252
|
+
try:
|
|
253
|
+
from nat.builder.intermediate_step_manager import IntermediateStepManager
|
|
254
|
+
|
|
255
|
+
# Make a snapshot to avoid "Set changed size during iteration" if GC runs
|
|
256
|
+
try:
|
|
257
|
+
instances_snapshot = list(IntermediateStepManager._active_instances)
|
|
258
|
+
except RuntimeError:
|
|
259
|
+
# Set changed during list() call - rare but possible
|
|
260
|
+
logger.debug("Set changed during snapshot, returning 0 for outstanding steps")
|
|
261
|
+
return 0
|
|
262
|
+
|
|
263
|
+
total_outstanding = 0
|
|
264
|
+
# Iterate through snapshot safely
|
|
265
|
+
for ref in instances_snapshot:
|
|
266
|
+
try:
|
|
267
|
+
manager = ref()
|
|
268
|
+
if manager is not None:
|
|
269
|
+
total_outstanding += manager.get_outstanding_step_count()
|
|
270
|
+
except (ReferenceError, AttributeError):
|
|
271
|
+
# Manager was GC'd or in invalid state - skip it
|
|
272
|
+
continue
|
|
273
|
+
return total_outstanding
|
|
274
|
+
except Exception as e:
|
|
275
|
+
logger.debug("Could not get outstanding step count: %s", e)
|
|
276
|
+
return 0
|
|
277
|
+
|
|
278
|
+
def get_stats(self) -> dict[str, Any]:
|
|
279
|
+
"""Get current memory statistics without logging."""
|
|
280
|
+
if not self.enabled:
|
|
281
|
+
return {"enabled": False}
|
|
282
|
+
|
|
283
|
+
mem = self._safe_traced_memory()
|
|
284
|
+
if mem is None:
|
|
285
|
+
return {
|
|
286
|
+
"enabled": True,
|
|
287
|
+
"request_count": self.request_count,
|
|
288
|
+
"current_memory_mb": None,
|
|
289
|
+
"peak_memory_mb": None,
|
|
290
|
+
"active_intermediate_managers": self._safe_intermediate_step_manager_count(),
|
|
291
|
+
"outstanding_steps": self._safe_outstanding_step_count(),
|
|
292
|
+
"active_exporters": self._safe_exporter_count(),
|
|
293
|
+
"isolated_exporters": self._safe_isolated_exporter_count(),
|
|
294
|
+
"subject_instances": self._count_instances_of_type("Subject"),
|
|
295
|
+
}
|
|
296
|
+
|
|
297
|
+
current_mb, peak_mb = mem
|
|
298
|
+
return {
|
|
299
|
+
"enabled": True,
|
|
300
|
+
"request_count": self.request_count,
|
|
301
|
+
"current_memory_mb": round(current_mb, 2),
|
|
302
|
+
"peak_memory_mb": round(peak_mb, 2),
|
|
303
|
+
"active_intermediate_managers": self._safe_intermediate_step_manager_count(),
|
|
304
|
+
"outstanding_steps": self._safe_outstanding_step_count(),
|
|
305
|
+
"active_exporters": self._safe_exporter_count(),
|
|
306
|
+
"isolated_exporters": self._safe_isolated_exporter_count(),
|
|
307
|
+
"subject_instances": self._count_instances_of_type("Subject"),
|
|
308
|
+
}
|
|
309
|
+
|
|
310
|
+
def reset_baseline(self) -> None:
|
|
311
|
+
"""Reset the baseline snapshot to current state."""
|
|
312
|
+
if not self.enabled:
|
|
313
|
+
return
|
|
314
|
+
gc.collect()
|
|
315
|
+
snap = self._safe_snapshot()
|
|
316
|
+
if snap is None:
|
|
317
|
+
logger.info("Cannot reset baseline: tracemalloc is not active.")
|
|
318
|
+
return
|
|
319
|
+
self.baseline_snapshot = snap
|
|
320
|
+
logger.info("Memory profiling baseline reset at request %d", self.request_count)
|
|
@@ -0,0 +1,27 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from collections.abc import AsyncIterator
|
|
17
|
+
|
|
18
|
+
from nat.cli.register_workflow import register_front_end
|
|
19
|
+
from nat.data_models.config import Config
|
|
20
|
+
from nat.front_ends.mcp.mcp_front_end_config import MCPFrontEndConfig
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
@register_front_end(config_type=MCPFrontEndConfig)
|
|
24
|
+
async def register_mcp_front_end(config: MCPFrontEndConfig, full_config: Config) -> AsyncIterator:
|
|
25
|
+
from nat.front_ends.mcp.mcp_front_end_plugin import MCPFrontEndPlugin
|
|
26
|
+
|
|
27
|
+
yield MCPFrontEndPlugin(full_config=full_config)
|