PyPI - nvidia-nat - Versions diffs - 1.2.0rc5__py3-none-any.whl - Mend

nvidia-nat 1.2.0rc5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (435) hide show

aiq/agent/__init__.py +0 -0
aiq/agent/base.py +239 -0
aiq/agent/dual_node.py +67 -0
aiq/agent/react_agent/__init__.py +0 -0
aiq/agent/react_agent/agent.py +355 -0
aiq/agent/react_agent/output_parser.py +104 -0
aiq/agent/react_agent/prompt.py +41 -0
aiq/agent/react_agent/register.py +149 -0
aiq/agent/reasoning_agent/__init__.py +0 -0
aiq/agent/reasoning_agent/reasoning_agent.py +225 -0
aiq/agent/register.py +23 -0
aiq/agent/rewoo_agent/__init__.py +0 -0
aiq/agent/rewoo_agent/agent.py +411 -0
aiq/agent/rewoo_agent/prompt.py +108 -0
aiq/agent/rewoo_agent/register.py +158 -0
aiq/agent/tool_calling_agent/__init__.py +0 -0
aiq/agent/tool_calling_agent/agent.py +119 -0
aiq/agent/tool_calling_agent/register.py +106 -0
aiq/authentication/__init__.py +14 -0
aiq/authentication/api_key/__init__.py +14 -0
aiq/authentication/api_key/api_key_auth_provider.py +96 -0
aiq/authentication/api_key/api_key_auth_provider_config.py +124 -0
aiq/authentication/api_key/register.py +26 -0
aiq/authentication/exceptions/__init__.py +14 -0
aiq/authentication/exceptions/api_key_exceptions.py +38 -0
aiq/authentication/http_basic_auth/__init__.py +0 -0
aiq/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
aiq/authentication/http_basic_auth/register.py +30 -0
aiq/authentication/interfaces.py +93 -0
aiq/authentication/oauth2/__init__.py +14 -0
aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +107 -0
aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
aiq/authentication/oauth2/register.py +25 -0
aiq/authentication/register.py +21 -0
aiq/builder/__init__.py +0 -0
aiq/builder/builder.py +285 -0
aiq/builder/component_utils.py +316 -0
aiq/builder/context.py +264 -0
aiq/builder/embedder.py +24 -0
aiq/builder/eval_builder.py +161 -0
aiq/builder/evaluator.py +29 -0
aiq/builder/framework_enum.py +24 -0
aiq/builder/front_end.py +73 -0
aiq/builder/function.py +344 -0
aiq/builder/function_base.py +380 -0
aiq/builder/function_info.py +627 -0
aiq/builder/intermediate_step_manager.py +174 -0
aiq/builder/llm.py +25 -0
aiq/builder/retriever.py +25 -0
aiq/builder/user_interaction_manager.py +74 -0
aiq/builder/workflow.py +148 -0
aiq/builder/workflow_builder.py +1117 -0
aiq/cli/__init__.py +14 -0
aiq/cli/cli_utils/__init__.py +0 -0
aiq/cli/cli_utils/config_override.py +231 -0
aiq/cli/cli_utils/validation.py +37 -0
aiq/cli/commands/__init__.py +0 -0
aiq/cli/commands/configure/__init__.py +0 -0
aiq/cli/commands/configure/channel/__init__.py +0 -0
aiq/cli/commands/configure/channel/add.py +28 -0
aiq/cli/commands/configure/channel/channel.py +36 -0
aiq/cli/commands/configure/channel/remove.py +30 -0
aiq/cli/commands/configure/channel/update.py +30 -0
aiq/cli/commands/configure/configure.py +33 -0
aiq/cli/commands/evaluate.py +139 -0
aiq/cli/commands/info/__init__.py +14 -0
aiq/cli/commands/info/info.py +39 -0
aiq/cli/commands/info/list_channels.py +32 -0
aiq/cli/commands/info/list_components.py +129 -0
aiq/cli/commands/info/list_mcp.py +213 -0
aiq/cli/commands/registry/__init__.py +14 -0
aiq/cli/commands/registry/publish.py +88 -0
aiq/cli/commands/registry/pull.py +118 -0
aiq/cli/commands/registry/registry.py +38 -0
aiq/cli/commands/registry/remove.py +108 -0
aiq/cli/commands/registry/search.py +155 -0
aiq/cli/commands/sizing/__init__.py +14 -0
aiq/cli/commands/sizing/calc.py +297 -0
aiq/cli/commands/sizing/sizing.py +27 -0
aiq/cli/commands/start.py +246 -0
aiq/cli/commands/uninstall.py +81 -0
aiq/cli/commands/validate.py +47 -0
aiq/cli/commands/workflow/__init__.py +14 -0
aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
aiq/cli/commands/workflow/templates/config.yml.j2 +16 -0
aiq/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
aiq/cli/commands/workflow/templates/register.py.j2 +5 -0
aiq/cli/commands/workflow/templates/workflow.py.j2 +36 -0
aiq/cli/commands/workflow/workflow.py +37 -0
aiq/cli/commands/workflow/workflow_commands.py +313 -0
aiq/cli/entrypoint.py +135 -0
aiq/cli/main.py +44 -0
aiq/cli/register_workflow.py +488 -0
aiq/cli/type_registry.py +1000 -0
aiq/data_models/__init__.py +14 -0
aiq/data_models/api_server.py +694 -0
aiq/data_models/authentication.py +231 -0
aiq/data_models/common.py +171 -0
aiq/data_models/component.py +54 -0
aiq/data_models/component_ref.py +168 -0
aiq/data_models/config.py +406 -0
aiq/data_models/dataset_handler.py +123 -0
aiq/data_models/discovery_metadata.py +335 -0
aiq/data_models/embedder.py +27 -0
aiq/data_models/evaluate.py +127 -0
aiq/data_models/evaluator.py +26 -0
aiq/data_models/front_end.py +26 -0
aiq/data_models/function.py +30 -0
aiq/data_models/function_dependencies.py +72 -0
aiq/data_models/interactive.py +246 -0
aiq/data_models/intermediate_step.py +302 -0
aiq/data_models/invocation_node.py +38 -0
aiq/data_models/llm.py +27 -0
aiq/data_models/logging.py +26 -0
aiq/data_models/memory.py +27 -0
aiq/data_models/object_store.py +44 -0
aiq/data_models/profiler.py +54 -0
aiq/data_models/registry_handler.py +26 -0
aiq/data_models/retriever.py +30 -0
aiq/data_models/retry_mixin.py +35 -0
aiq/data_models/span.py +187 -0
aiq/data_models/step_adaptor.py +64 -0
aiq/data_models/streaming.py +33 -0
aiq/data_models/swe_bench_model.py +54 -0
aiq/data_models/telemetry_exporter.py +26 -0
aiq/data_models/ttc_strategy.py +30 -0
aiq/embedder/__init__.py +0 -0
aiq/embedder/langchain_client.py +41 -0
aiq/embedder/nim_embedder.py +59 -0
aiq/embedder/openai_embedder.py +43 -0
aiq/embedder/register.py +24 -0
aiq/eval/__init__.py +14 -0
aiq/eval/config.py +60 -0
aiq/eval/dataset_handler/__init__.py +0 -0
aiq/eval/dataset_handler/dataset_downloader.py +106 -0
aiq/eval/dataset_handler/dataset_filter.py +52 -0
aiq/eval/dataset_handler/dataset_handler.py +254 -0
aiq/eval/evaluate.py +506 -0
aiq/eval/evaluator/__init__.py +14 -0
aiq/eval/evaluator/base_evaluator.py +73 -0
aiq/eval/evaluator/evaluator_model.py +45 -0
aiq/eval/intermediate_step_adapter.py +99 -0
aiq/eval/rag_evaluator/__init__.py +0 -0
aiq/eval/rag_evaluator/evaluate.py +178 -0
aiq/eval/rag_evaluator/register.py +143 -0
aiq/eval/register.py +23 -0
aiq/eval/remote_workflow.py +133 -0
aiq/eval/runners/__init__.py +14 -0
aiq/eval/runners/config.py +39 -0
aiq/eval/runners/multi_eval_runner.py +54 -0
aiq/eval/runtime_event_subscriber.py +52 -0
aiq/eval/swe_bench_evaluator/__init__.py +0 -0
aiq/eval/swe_bench_evaluator/evaluate.py +215 -0
aiq/eval/swe_bench_evaluator/register.py +36 -0
aiq/eval/trajectory_evaluator/__init__.py +0 -0
aiq/eval/trajectory_evaluator/evaluate.py +75 -0
aiq/eval/trajectory_evaluator/register.py +40 -0
aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
aiq/eval/tunable_rag_evaluator/evaluate.py +245 -0
aiq/eval/tunable_rag_evaluator/register.py +52 -0
aiq/eval/usage_stats.py +41 -0
aiq/eval/utils/__init__.py +0 -0
aiq/eval/utils/output_uploader.py +140 -0
aiq/eval/utils/tqdm_position_registry.py +40 -0
aiq/eval/utils/weave_eval.py +184 -0
aiq/experimental/__init__.py +0 -0
aiq/experimental/decorators/__init__.py +0 -0
aiq/experimental/decorators/experimental_warning_decorator.py +130 -0
aiq/experimental/test_time_compute/__init__.py +0 -0
aiq/experimental/test_time_compute/editing/__init__.py +0 -0
aiq/experimental/test_time_compute/editing/iterative_plan_refinement_editor.py +147 -0
aiq/experimental/test_time_compute/editing/llm_as_a_judge_editor.py +204 -0
aiq/experimental/test_time_compute/editing/motivation_aware_summarization.py +107 -0
aiq/experimental/test_time_compute/functions/__init__.py +0 -0
aiq/experimental/test_time_compute/functions/execute_score_select_function.py +105 -0
aiq/experimental/test_time_compute/functions/its_tool_orchestration_function.py +205 -0
aiq/experimental/test_time_compute/functions/its_tool_wrapper_function.py +146 -0
aiq/experimental/test_time_compute/functions/plan_select_execute_function.py +224 -0
aiq/experimental/test_time_compute/models/__init__.py +0 -0
aiq/experimental/test_time_compute/models/editor_config.py +132 -0
aiq/experimental/test_time_compute/models/scoring_config.py +112 -0
aiq/experimental/test_time_compute/models/search_config.py +120 -0
aiq/experimental/test_time_compute/models/selection_config.py +154 -0
aiq/experimental/test_time_compute/models/stage_enums.py +43 -0
aiq/experimental/test_time_compute/models/strategy_base.py +66 -0
aiq/experimental/test_time_compute/models/tool_use_config.py +41 -0
aiq/experimental/test_time_compute/models/ttc_item.py +48 -0
aiq/experimental/test_time_compute/register.py +36 -0
aiq/experimental/test_time_compute/scoring/__init__.py +0 -0
aiq/experimental/test_time_compute/scoring/llm_based_agent_scorer.py +168 -0
aiq/experimental/test_time_compute/scoring/llm_based_plan_scorer.py +168 -0
aiq/experimental/test_time_compute/scoring/motivation_aware_scorer.py +111 -0
aiq/experimental/test_time_compute/search/__init__.py +0 -0
aiq/experimental/test_time_compute/search/multi_llm_planner.py +128 -0
aiq/experimental/test_time_compute/search/multi_query_retrieval_search.py +122 -0
aiq/experimental/test_time_compute/search/single_shot_multi_plan_planner.py +128 -0
aiq/experimental/test_time_compute/selection/__init__.py +0 -0
aiq/experimental/test_time_compute/selection/best_of_n_selector.py +63 -0
aiq/experimental/test_time_compute/selection/llm_based_agent_output_selector.py +131 -0
aiq/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +159 -0
aiq/experimental/test_time_compute/selection/llm_based_plan_selector.py +128 -0
aiq/experimental/test_time_compute/selection/threshold_selector.py +58 -0
aiq/front_ends/__init__.py +14 -0
aiq/front_ends/console/__init__.py +14 -0
aiq/front_ends/console/authentication_flow_handler.py +233 -0
aiq/front_ends/console/console_front_end_config.py +32 -0
aiq/front_ends/console/console_front_end_plugin.py +96 -0
aiq/front_ends/console/register.py +25 -0
aiq/front_ends/cron/__init__.py +14 -0
aiq/front_ends/fastapi/__init__.py +14 -0
aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +107 -0
aiq/front_ends/fastapi/fastapi_front_end_config.py +234 -0
aiq/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
aiq/front_ends/fastapi/fastapi_front_end_plugin.py +116 -0
aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +1092 -0
aiq/front_ends/fastapi/html_snippets/__init__.py +14 -0
aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
aiq/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
aiq/front_ends/fastapi/job_store.py +183 -0
aiq/front_ends/fastapi/main.py +72 -0
aiq/front_ends/fastapi/message_handler.py +298 -0
aiq/front_ends/fastapi/message_validator.py +345 -0
aiq/front_ends/fastapi/register.py +25 -0
aiq/front_ends/fastapi/response_helpers.py +195 -0
aiq/front_ends/fastapi/step_adaptor.py +321 -0
aiq/front_ends/mcp/__init__.py +14 -0
aiq/front_ends/mcp/mcp_front_end_config.py +32 -0
aiq/front_ends/mcp/mcp_front_end_plugin.py +93 -0
aiq/front_ends/mcp/register.py +27 -0
aiq/front_ends/mcp/tool_converter.py +242 -0
aiq/front_ends/register.py +22 -0
aiq/front_ends/simple_base/__init__.py +14 -0
aiq/front_ends/simple_base/simple_front_end_plugin_base.py +54 -0
aiq/llm/__init__.py +0 -0
aiq/llm/aws_bedrock_llm.py +57 -0
aiq/llm/nim_llm.py +46 -0
aiq/llm/openai_llm.py +46 -0
aiq/llm/register.py +23 -0
aiq/llm/utils/__init__.py +14 -0
aiq/llm/utils/env_config_value.py +94 -0
aiq/llm/utils/error.py +17 -0
aiq/memory/__init__.py +20 -0
aiq/memory/interfaces.py +183 -0
aiq/memory/models.py +112 -0
aiq/meta/module_to_distro.json +3 -0
aiq/meta/pypi.md +58 -0
aiq/object_store/__init__.py +20 -0
aiq/object_store/in_memory_object_store.py +76 -0
aiq/object_store/interfaces.py +84 -0
aiq/object_store/models.py +36 -0
aiq/object_store/register.py +20 -0
aiq/observability/__init__.py +14 -0
aiq/observability/exporter/__init__.py +14 -0
aiq/observability/exporter/base_exporter.py +449 -0
aiq/observability/exporter/exporter.py +78 -0
aiq/observability/exporter/file_exporter.py +33 -0
aiq/observability/exporter/processing_exporter.py +322 -0
aiq/observability/exporter/raw_exporter.py +52 -0
aiq/observability/exporter/span_exporter.py +265 -0
aiq/observability/exporter_manager.py +335 -0
aiq/observability/mixin/__init__.py +14 -0
aiq/observability/mixin/batch_config_mixin.py +26 -0
aiq/observability/mixin/collector_config_mixin.py +23 -0
aiq/observability/mixin/file_mixin.py +288 -0
aiq/observability/mixin/file_mode.py +23 -0
aiq/observability/mixin/resource_conflict_mixin.py +134 -0
aiq/observability/mixin/serialize_mixin.py +61 -0
aiq/observability/mixin/type_introspection_mixin.py +183 -0
aiq/observability/processor/__init__.py +14 -0
aiq/observability/processor/batching_processor.py +310 -0
aiq/observability/processor/callback_processor.py +42 -0
aiq/observability/processor/intermediate_step_serializer.py +28 -0
aiq/observability/processor/processor.py +71 -0
aiq/observability/register.py +96 -0
aiq/observability/utils/__init__.py +14 -0
aiq/observability/utils/dict_utils.py +236 -0
aiq/observability/utils/time_utils.py +31 -0
aiq/plugins/.namespace +1 -0
aiq/profiler/__init__.py +0 -0
aiq/profiler/calc/__init__.py +14 -0
aiq/profiler/calc/calc_runner.py +627 -0
aiq/profiler/calc/calculations.py +288 -0
aiq/profiler/calc/data_models.py +188 -0
aiq/profiler/calc/plot.py +345 -0
aiq/profiler/callbacks/__init__.py +0 -0
aiq/profiler/callbacks/agno_callback_handler.py +295 -0
aiq/profiler/callbacks/base_callback_class.py +20 -0
aiq/profiler/callbacks/langchain_callback_handler.py +290 -0
aiq/profiler/callbacks/llama_index_callback_handler.py +205 -0
aiq/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
aiq/profiler/callbacks/token_usage_base_model.py +27 -0
aiq/profiler/data_frame_row.py +51 -0
aiq/profiler/data_models.py +24 -0
aiq/profiler/decorators/__init__.py +0 -0
aiq/profiler/decorators/framework_wrapper.py +131 -0
aiq/profiler/decorators/function_tracking.py +254 -0
aiq/profiler/forecasting/__init__.py +0 -0
aiq/profiler/forecasting/config.py +18 -0
aiq/profiler/forecasting/model_trainer.py +75 -0
aiq/profiler/forecasting/models/__init__.py +22 -0
aiq/profiler/forecasting/models/forecasting_base_model.py +40 -0
aiq/profiler/forecasting/models/linear_model.py +196 -0
aiq/profiler/forecasting/models/random_forest_regressor.py +268 -0
aiq/profiler/inference_metrics_model.py +28 -0
aiq/profiler/inference_optimization/__init__.py +0 -0
aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +460 -0
aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
aiq/profiler/inference_optimization/data_models.py +386 -0
aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
aiq/profiler/inference_optimization/llm_metrics.py +212 -0
aiq/profiler/inference_optimization/prompt_caching.py +163 -0
aiq/profiler/inference_optimization/token_uniqueness.py +107 -0
aiq/profiler/inference_optimization/workflow_runtimes.py +72 -0
aiq/profiler/intermediate_property_adapter.py +102 -0
aiq/profiler/profile_runner.py +473 -0
aiq/profiler/utils.py +184 -0
aiq/registry_handlers/__init__.py +0 -0
aiq/registry_handlers/local/__init__.py +0 -0
aiq/registry_handlers/local/local_handler.py +176 -0
aiq/registry_handlers/local/register_local.py +37 -0
aiq/registry_handlers/metadata_factory.py +60 -0
aiq/registry_handlers/package_utils.py +567 -0
aiq/registry_handlers/pypi/__init__.py +0 -0
aiq/registry_handlers/pypi/pypi_handler.py +251 -0
aiq/registry_handlers/pypi/register_pypi.py +40 -0
aiq/registry_handlers/register.py +21 -0
aiq/registry_handlers/registry_handler_base.py +157 -0
aiq/registry_handlers/rest/__init__.py +0 -0
aiq/registry_handlers/rest/register_rest.py +56 -0
aiq/registry_handlers/rest/rest_handler.py +237 -0
aiq/registry_handlers/schemas/__init__.py +0 -0
aiq/registry_handlers/schemas/headers.py +42 -0
aiq/registry_handlers/schemas/package.py +68 -0
aiq/registry_handlers/schemas/publish.py +63 -0
aiq/registry_handlers/schemas/pull.py +82 -0
aiq/registry_handlers/schemas/remove.py +36 -0
aiq/registry_handlers/schemas/search.py +91 -0
aiq/registry_handlers/schemas/status.py +47 -0
aiq/retriever/__init__.py +0 -0
aiq/retriever/interface.py +37 -0
aiq/retriever/milvus/__init__.py +14 -0
aiq/retriever/milvus/register.py +81 -0
aiq/retriever/milvus/retriever.py +228 -0
aiq/retriever/models.py +74 -0
aiq/retriever/nemo_retriever/__init__.py +14 -0
aiq/retriever/nemo_retriever/register.py +60 -0
aiq/retriever/nemo_retriever/retriever.py +190 -0
aiq/retriever/register.py +22 -0
aiq/runtime/__init__.py +14 -0
aiq/runtime/loader.py +215 -0
aiq/runtime/runner.py +190 -0
aiq/runtime/session.py +158 -0
aiq/runtime/user_metadata.py +130 -0
aiq/settings/__init__.py +0 -0
aiq/settings/global_settings.py +318 -0
aiq/test/.namespace +1 -0
aiq/tool/__init__.py +0 -0
aiq/tool/chat_completion.py +74 -0
aiq/tool/code_execution/README.md +151 -0
aiq/tool/code_execution/__init__.py +0 -0
aiq/tool/code_execution/code_sandbox.py +267 -0
aiq/tool/code_execution/local_sandbox/.gitignore +1 -0
aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
aiq/tool/code_execution/local_sandbox/__init__.py +13 -0
aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +198 -0
aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +6 -0
aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +50 -0
aiq/tool/code_execution/register.py +74 -0
aiq/tool/code_execution/test_code_execution_sandbox.py +414 -0
aiq/tool/code_execution/utils.py +100 -0
aiq/tool/datetime_tools.py +42 -0
aiq/tool/document_search.py +141 -0
aiq/tool/github_tools/__init__.py +0 -0
aiq/tool/github_tools/create_github_commit.py +133 -0
aiq/tool/github_tools/create_github_issue.py +87 -0
aiq/tool/github_tools/create_github_pr.py +106 -0
aiq/tool/github_tools/get_github_file.py +106 -0
aiq/tool/github_tools/get_github_issue.py +166 -0
aiq/tool/github_tools/get_github_pr.py +256 -0
aiq/tool/github_tools/update_github_issue.py +100 -0
aiq/tool/mcp/__init__.py +14 -0
aiq/tool/mcp/exceptions.py +142 -0
aiq/tool/mcp/mcp_client.py +255 -0
aiq/tool/mcp/mcp_tool.py +96 -0
aiq/tool/memory_tools/__init__.py +0 -0
aiq/tool/memory_tools/add_memory_tool.py +79 -0
aiq/tool/memory_tools/delete_memory_tool.py +67 -0
aiq/tool/memory_tools/get_memory_tool.py +72 -0
aiq/tool/nvidia_rag.py +95 -0
aiq/tool/register.py +38 -0
aiq/tool/retriever.py +89 -0
aiq/tool/server_tools.py +66 -0
aiq/utils/__init__.py +0 -0
aiq/utils/data_models/__init__.py +0 -0
aiq/utils/data_models/schema_validator.py +58 -0
aiq/utils/debugging_utils.py +43 -0
aiq/utils/dump_distro_mapping.py +32 -0
aiq/utils/exception_handlers/__init__.py +0 -0
aiq/utils/exception_handlers/automatic_retries.py +289 -0
aiq/utils/exception_handlers/mcp.py +211 -0
aiq/utils/exception_handlers/schemas.py +114 -0
aiq/utils/io/__init__.py +0 -0
aiq/utils/io/model_processing.py +28 -0
aiq/utils/io/yaml_tools.py +119 -0
aiq/utils/log_utils.py +37 -0
aiq/utils/metadata_utils.py +74 -0
aiq/utils/optional_imports.py +142 -0
aiq/utils/producer_consumer_queue.py +178 -0
aiq/utils/reactive/__init__.py +0 -0
aiq/utils/reactive/base/__init__.py +0 -0
aiq/utils/reactive/base/observable_base.py +65 -0
aiq/utils/reactive/base/observer_base.py +55 -0
aiq/utils/reactive/base/subject_base.py +79 -0
aiq/utils/reactive/observable.py +59 -0
aiq/utils/reactive/observer.py +76 -0
aiq/utils/reactive/subject.py +131 -0
aiq/utils/reactive/subscription.py +49 -0
aiq/utils/settings/__init__.py +0 -0
aiq/utils/settings/global_settings.py +197 -0
aiq/utils/string_utils.py +38 -0
aiq/utils/type_converter.py +290 -0
aiq/utils/type_utils.py +484 -0
aiq/utils/url_utils.py +27 -0
nvidia_nat-1.2.0rc5.dist-info/METADATA +363 -0
nvidia_nat-1.2.0rc5.dist-info/RECORD +435 -0
nvidia_nat-1.2.0rc5.dist-info/WHEEL +5 -0
nvidia_nat-1.2.0rc5.dist-info/entry_points.txt +20 -0
nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE-3rd-party.txt +3686 -0
nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE.md +201 -0
nvidia_nat-1.2.0rc5.dist-info/top_level.txt +1 -0

aiq/profiler/inference_optimization/prompt_caching.py ADDED Viewed

@@ -0,0 +1,163 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from aiq.data_models.intermediate_step import IntermediateStep
+from aiq.profiler.inference_optimization.data_models import CommonPrefixesOutput
+from aiq.profiler.inference_optimization.data_models import FrameworkLLMPrefixData
+from aiq.profiler.inference_optimization.data_models import PrefixInfo
+from aiq.profiler.utils import create_standardized_dataframe
+# -----------------------------------------------------------
+# 1. Helper: Build a prefix trie
+# -----------------------------------------------------------
+def build_prefix_trie(strings: list[str]) -> dict:
+    """
+    Assemble a character-level trie out of the given strings.
+    Every node is a plain dictionary shaped like::
+        {
+            'count': int,         # how many input strings walk through this node
+            'children': dict[str, TrieNode]   # next character -> child node
+        }
+    The root's 'count' equals the number of input strings (empty strings
+    included); an empty input list yields a root with count 0 and no children.
+    """
+    trie = {'count': 0, 'children': {}}
+    for text in strings:
+        # Each string is counted once at the root before descending.
+        trie['count'] += 1
+        cursor = trie
+        for symbol in text:
+            # Reuse the existing child or create a fresh zero-count node.
+            cursor = cursor['children'].setdefault(symbol, {'count': 0, 'children': {}})
+            cursor['count'] += 1
+    return trie
+# -----------------------------------------------------------
+# 2. Helper: Iterative traversal of the trie
+# -----------------------------------------------------------
+def collect_prefixes_iterative(root: dict, total_calls: int) -> list[dict]:
+    """
+    Walk the trie with an explicit stack (no recursion, so deep tries cannot
+    hit the interpreter's recursion limit) and emit one record per non-empty prefix.
+    :param root: Trie node with 'count' and 'children'
+    :param total_calls: Number of total calls in this group (denominator for the
+                        'calls_percentage' fraction)
+    :return: A list of dicts with the keys 'prefix', 'prefix_length',
+             'calls_count' and 'calls_percentage', in depth-first visiting order
+    """
+    collected = []
+    # Work list of (node, text accumulated on the path to that node).
+    pending = [(root, "")]
+    while pending:
+        current, text = pending.pop()
+        # The root carries the empty prefix, which is never reported.
+        if text:
+            hits = current['count']
+            collected.append({
+                'prefix': text,
+                'prefix_length': len(text),
+                'calls_count': hits,
+                'calls_percentage': hits / total_calls
+            })
+        # Schedule every child with its extended prefix.
+        pending.extend((child, text + ch) for ch, child in current['children'].items())
+    return collected
+# -----------------------------------------------------------
+# 3. Main Function
+# -----------------------------------------------------------
+def get_common_prefixes(all_steps: list[list[IntermediateStep]],
+                        min_call_percentage: float = 0.0) -> CommonPrefixesOutput:
+    """
+    Compute common-prefix statistics for LLM text inputs, grouped per LLM name.
+    The steps are converted with ``create_standardized_dataframe``; the resulting
+    DataFrame must contain the columns 'framework', 'llm_name' and 'llm_text_input'.
+    For each distinct 'llm_name':
+    1) A character trie is built over the group's 'llm_text_input' values (cast to str).
+    2) Only prefixes with calls_percentage >= `min_call_percentage` are kept.
+    3) The remaining prefixes are sorted by prefix length (descending), then by
+       call count (descending).
+    4) A prefix is dropped when it is a substring of a longer prefix that has
+       already been retained.
+    :param all_steps: Intermediate steps, forwarded unchanged to
+                      ``create_standardized_dataframe``.
+    :param min_call_percentage: Exclude prefixes that appear in fewer than this fraction
+                                of the group's calls. (Default 0.0 = no filtering)
+    :return: CommonPrefixesOutput whose root maps "<llm_name>" to a
+             FrameworkLLMPrefixData holding the group's total call count and
+             its retained PrefixInfo entries.
+    :raises ValueError: If the DataFrame lacks any of the required columns.
+    """
+    df = create_standardized_dataframe(all_steps)
+    # Validate necessary columns
+    required_cols = {'framework', 'llm_name', 'llm_text_input'}
+    missing = required_cols - set(df.columns)
+    if missing:
+        raise ValueError(f"DataFrame missing required columns: {missing}")
+    output_data: dict[str, FrameworkLLMPrefixData] = {}
+    # Group by llm_name only; 'framework' is validated above but is not part of the key.
+    for group_key, group_df in df.groupby(['llm_name']):
+        # A one-element list grouper yields a 1-tuple key on current pandas but a bare
+        # value on older releases; indexing a bare string would take its first character.
+        llm_name = group_key[0] if isinstance(group_key, tuple) else group_key
+        text_inputs = group_df['llm_text_input'].astype(str).tolist()
+        total_calls = len(text_inputs)
+        # Build trie for all text inputs
+        trie = build_prefix_trie(text_inputs)
+        # Collect prefix info using iterative traversal
+        results = collect_prefixes_iterative(trie, total_calls=total_calls)
+        # 1) Filter out prefixes below min_call_percentage
+        results_filtered = [r for r in results if r['calls_percentage'] >= min_call_percentage]
+        # 2) Sort results: prefix_length desc, then calls_count desc
+        results_sorted = sorted(results_filtered, key=lambda x: (x['prefix_length'], x['calls_count']), reverse=True)
+        # 3) Substring filtering:
+        #    results_sorted is in descending length order, so every prefix kept so far
+        #    is at least as long as the candidate; the candidate is skipped when it
+        #    occurs inside any of them.
+        final_results: list[dict] = []
+        for r in results_sorted:
+            pfx = r['prefix']
+            if not any(pfx in kept['prefix'] for kept in final_results):
+                final_results.append(r)
+        # Convert each dict to a PrefixInfo model and store it under the LLM name
+        prefix_info_list = [PrefixInfo(**res) for res in final_results]
+        output_data[str(llm_name)] = FrameworkLLMPrefixData(total_calls=total_calls, prefix_info=prefix_info_list)
+    # Package the final result in a validated RootModel
+    return CommonPrefixesOutput(root=output_data)

aiq/profiler/inference_optimization/token_uniqueness.py ADDED Viewed

@@ -0,0 +1,107 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import re
+import numpy as np
+from aiq.data_models.intermediate_step import IntermediateStep
+from aiq.profiler.inference_optimization.data_models import LLMUniquenessMetrics
+from aiq.profiler.inference_optimization.data_models import LLMUniquenessMetricsByLLM
+from aiq.profiler.utils import create_standardized_dataframe
+# ----------------------------------------------------------------
+# 1. Main Function
+# ----------------------------------------------------------------
+def compute_inter_query_token_uniqueness_by_llm(all_steps: list[list[IntermediateStep]]) -> LLMUniquenessMetricsByLLM:
+    """
+    Report, per LLM, the p90/p95/p99 of the number of 'new words' that each
+    LLM_START input adds relative to the previous LLM_START input of the same
+    (llm_name, example_number) group.
+    Procedure:
+    1. Keep only rows whose event_type equals 'LLM_START'.
+    2. Group by (llm_name, example_number) and order each group by event_timestamp.
+    3. For every row, count the lower-cased ``\\w+`` tokens of llm_text_input that
+       are absent from the preceding row's llm_text_input; rows without a
+       preceding input are discarded.
+    4. Pool the counts per llm_name and take the 90th, 95th and 99th percentiles.
+    5. Return a Pydantic RootModel containing a dictionary::
+         { llm_name -> LLMUniquenessMetrics(p90, p95, p99) }.
+    An empty mapping is returned when there are no LLM_START rows; a ValueError
+    is raised when a required column is missing.
+    """
+    def tokenize_to_set(text: str) -> set:
+        # Non-string values (e.g. the NaN produced by shift) contribute no tokens.
+        if isinstance(text, str):
+            return set(re.findall(r"\w+", text.lower()))
+        return set()
+    def compute_new_words(row):
+        # Tokens of the current input that the previous input did not contain.
+        seen_before = tokenize_to_set(row['prev_llm_text_input'])
+        seen_now = tokenize_to_set(row['llm_text_input'])
+        return len(seen_now - seen_before)
+    df = create_standardized_dataframe(all_steps)
+    # Validate that the necessary columns exist
+    required_cols = {'event_type', 'llm_name', 'example_number', 'event_timestamp', 'llm_text_input'}
+    missing = required_cols - set(df.columns)
+    if missing:
+        raise ValueError(f"DataFrame missing required columns: {missing}")
+    # Step 1: restrict to LLM_START events
+    starts = df[df['event_type'] == 'LLM_START'].copy()
+    if starts.empty:
+        return LLMUniquenessMetricsByLLM(root={})
+    # Pooled new-word counts, keyed by llm_name
+    pooled: dict[str, list[int]] = {}
+    # Steps 2-3: per (llm_name, example_number) group, compare consecutive inputs
+    by_llm_and_example = starts.groupby(['llm_name', 'example_number'], as_index=False, group_keys=True)
+    for (llm, _example), chunk in by_llm_and_example:
+        ordered = chunk.sort_values('event_timestamp', ascending=True)
+        # Align every row with the input of the call that preceded it
+        ordered['prev_llm_text_input'] = ordered['llm_text_input'].shift(1)
+        ordered['new_words_count'] = ordered.apply(compute_new_words, axis=1)
+        # Rows lacking a previous input carry no comparison and are dropped
+        with_predecessor = ordered.dropna(subset=['prev_llm_text_input'])
+        fresh_counts = with_predecessor['new_words_count'].tolist()
+        if fresh_counts:
+            pooled.setdefault(llm, []).extend(fresh_counts)
+    # Step 4: percentiles per llm_name
+    metrics_by_llm = {}
+    for llm_name, counts_list in pooled.items():
+        samples = np.array(counts_list)
+        quantiles = {f"p{q}": float(np.percentile(samples, q)) for q in (90, 95, 99)}
+        metrics_by_llm[llm_name] = LLMUniquenessMetrics(**quantiles)
+    # Step 5: validate & return as a RootModel
+    return LLMUniquenessMetricsByLLM(root=metrics_by_llm)

aiq/profiler/inference_optimization/workflow_runtimes.py ADDED Viewed

@@ -0,0 +1,72 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import numpy as np
+from aiq.data_models.intermediate_step import IntermediateStep
+from aiq.profiler.inference_optimization.data_models import WorkflowRuntimeMetrics
+from aiq.profiler.utils import create_standardized_dataframe
+def compute_workflow_runtime_metrics(all_steps: list[list[IntermediateStep]]) -> WorkflowRuntimeMetrics:
+    """
+    Computes the p90, p95, and p99 of workflow runtime for each example_number.
+    The 'workflow runtime' per example is::
+        max(event_timestamp) - min(event_timestamp)
+    for that example_number.
+    Parameters
+    ----------
+    all_steps : IntermediateStep
+        Must contain at least two columns:
+          - 'example_number'
+          - 'event_timestamp'
+    Returns
+    -------
+    WorkflowRuntimeMetrics
+        A Pydantic model with 'p90', 'p95', and 'p99' attributes.
+    """
+    df = create_standardized_dataframe(all_steps)
+    required_cols = {"example_number", "event_timestamp"}
+    missing = required_cols - set(df.columns)
+    if missing:
+        raise ValueError(f"DataFrame is missing required columns: {missing}")
+    # Group by example_number, then find min and max timestamp
+    grouped = df.groupby("example_number")["event_timestamp"]
+    min_timestamps = grouped.min()
+    max_timestamps = grouped.max()
+    # Workflow runtime is difference between max and min
+    runtimes = max_timestamps - min_timestamps
+    # Convert to a NumPy array for percentile calculations
+    runtimes_arr = runtimes.values
+    # Edge case: if there's only one example or no data
+    # (NumPy percentile can handle 1-element arrays, but let's guard for empties)
+    if len(runtimes_arr) == 0:
+        return WorkflowRuntimeMetrics(p90=0.0, p95=0.0, p99=0.0)
+    # Compute p90, p95, p99
+    p90_val = float(np.percentile(runtimes_arr, 90))
+    p95_val = float(np.percentile(runtimes_arr, 95))
+    p99_val = float(np.percentile(runtimes_arr, 99))
+    return WorkflowRuntimeMetrics(p90=p90_val, p95=p95_val, p99=p99_val)

aiq/profiler/intermediate_property_adapter.py ADDED Viewed

@@ -0,0 +1,102 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from aiq.data_models.intermediate_step import IntermediateStep
+from aiq.data_models.intermediate_step import IntermediateStepType
+from aiq.data_models.intermediate_step import TokenUsageBaseModel
+class IntermediatePropertyAdaptor(IntermediateStep):
+    @classmethod
+    def from_intermediate_step(cls, step: IntermediateStep) -> "IntermediatePropertyAdaptor":
+        """
+        Create an adaptor instance from an existing IntermediateStep.
+        Uses the dict() representation of the instance to initialize the adaptor.
+        """
+        return cls(**step.model_dump())
+    @property
+    def token_usage(self) -> TokenUsageBaseModel:
+        return self.payload.usage_info.token_usage if self.payload.usage_info else TokenUsageBaseModel()
+    @property
+    def seconds_between_calls(self) -> int:
+        return self.payload.usage_info.seconds_between_calls if self.payload.usage_info else 0
+    @property
+    def llm_text_input(self) -> str:
+        ret = ""
+        if self.payload.data and self.event_type == IntermediateStepType.LLM_START:
+            ret = self.payload.data.input
+        return ret
+    @property
+    def llm_text_output(self) -> str:
+        ret = ""
+        if self.payload.data and self.event_type == IntermediateStepType.LLM_END:
+            ret = self.payload.data.output
+        return ret
+    @property
+    def llm_text_chunk(self) -> str:
+        ret = ""
+        if self.payload.data and self.event_type == IntermediateStepType.LLM_NEW_TOKEN:
+            ret = self.payload.data.chunk
+        return ret
+    @property
+    def tool_input(self) -> str:
+        ret = ""
+        if self.payload.data and self.event_type == IntermediateStepType.TOOL_START:
+            ret = self.payload.data.input
+        return ret
+    @property
+    def tool_output(self) -> str:
+        ret = ""
+        if self.payload.data and self.event_type == IntermediateStepType.TOOL_END:
+            ret = self.payload.data.output
+        return ret
+    @property
+    def llm_name(self) -> str:
+        ret = ""
+        if self.payload.name and self.event_type in [IntermediateStepType.LLM_START, IntermediateStepType.LLM_END]:
+            ret = self.payload.name
+        return ret
+    @property
+    def tool_name(self) -> str:
+        ret = ""
+        if self.payload.name and self.event_type in [IntermediateStepType.TOOL_START, IntermediateStepType.TOOL_END]:
+            ret = self.payload.name
+        return ret
+    @property
+    def function_name(self) -> str:
+        return self.function_ancestry.function_name
+    @property
+    def function_id(self) -> str:
+        return self.function_ancestry.function_id
+    @property
+    def parent_function_id(self) -> str:
+        return self.function_ancestry.parent_id
+    @property
+    def parent_function_name(self) -> str:
+        return self.function_ancestry.parent_name