nvidia-nat 1.2.0rc5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- aiq/agent/__init__.py +0 -0
- aiq/agent/base.py +239 -0
- aiq/agent/dual_node.py +67 -0
- aiq/agent/react_agent/__init__.py +0 -0
- aiq/agent/react_agent/agent.py +355 -0
- aiq/agent/react_agent/output_parser.py +104 -0
- aiq/agent/react_agent/prompt.py +41 -0
- aiq/agent/react_agent/register.py +149 -0
- aiq/agent/reasoning_agent/__init__.py +0 -0
- aiq/agent/reasoning_agent/reasoning_agent.py +225 -0
- aiq/agent/register.py +23 -0
- aiq/agent/rewoo_agent/__init__.py +0 -0
- aiq/agent/rewoo_agent/agent.py +411 -0
- aiq/agent/rewoo_agent/prompt.py +108 -0
- aiq/agent/rewoo_agent/register.py +158 -0
- aiq/agent/tool_calling_agent/__init__.py +0 -0
- aiq/agent/tool_calling_agent/agent.py +119 -0
- aiq/agent/tool_calling_agent/register.py +106 -0
- aiq/authentication/__init__.py +14 -0
- aiq/authentication/api_key/__init__.py +14 -0
- aiq/authentication/api_key/api_key_auth_provider.py +96 -0
- aiq/authentication/api_key/api_key_auth_provider_config.py +124 -0
- aiq/authentication/api_key/register.py +26 -0
- aiq/authentication/exceptions/__init__.py +14 -0
- aiq/authentication/exceptions/api_key_exceptions.py +38 -0
- aiq/authentication/http_basic_auth/__init__.py +0 -0
- aiq/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
- aiq/authentication/http_basic_auth/register.py +30 -0
- aiq/authentication/interfaces.py +93 -0
- aiq/authentication/oauth2/__init__.py +14 -0
- aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +107 -0
- aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
- aiq/authentication/oauth2/register.py +25 -0
- aiq/authentication/register.py +21 -0
- aiq/builder/__init__.py +0 -0
- aiq/builder/builder.py +285 -0
- aiq/builder/component_utils.py +316 -0
- aiq/builder/context.py +264 -0
- aiq/builder/embedder.py +24 -0
- aiq/builder/eval_builder.py +161 -0
- aiq/builder/evaluator.py +29 -0
- aiq/builder/framework_enum.py +24 -0
- aiq/builder/front_end.py +73 -0
- aiq/builder/function.py +344 -0
- aiq/builder/function_base.py +380 -0
- aiq/builder/function_info.py +627 -0
- aiq/builder/intermediate_step_manager.py +174 -0
- aiq/builder/llm.py +25 -0
- aiq/builder/retriever.py +25 -0
- aiq/builder/user_interaction_manager.py +74 -0
- aiq/builder/workflow.py +148 -0
- aiq/builder/workflow_builder.py +1117 -0
- aiq/cli/__init__.py +14 -0
- aiq/cli/cli_utils/__init__.py +0 -0
- aiq/cli/cli_utils/config_override.py +231 -0
- aiq/cli/cli_utils/validation.py +37 -0
- aiq/cli/commands/__init__.py +0 -0
- aiq/cli/commands/configure/__init__.py +0 -0
- aiq/cli/commands/configure/channel/__init__.py +0 -0
- aiq/cli/commands/configure/channel/add.py +28 -0
- aiq/cli/commands/configure/channel/channel.py +36 -0
- aiq/cli/commands/configure/channel/remove.py +30 -0
- aiq/cli/commands/configure/channel/update.py +30 -0
- aiq/cli/commands/configure/configure.py +33 -0
- aiq/cli/commands/evaluate.py +139 -0
- aiq/cli/commands/info/__init__.py +14 -0
- aiq/cli/commands/info/info.py +39 -0
- aiq/cli/commands/info/list_channels.py +32 -0
- aiq/cli/commands/info/list_components.py +129 -0
- aiq/cli/commands/info/list_mcp.py +213 -0
- aiq/cli/commands/registry/__init__.py +14 -0
- aiq/cli/commands/registry/publish.py +88 -0
- aiq/cli/commands/registry/pull.py +118 -0
- aiq/cli/commands/registry/registry.py +38 -0
- aiq/cli/commands/registry/remove.py +108 -0
- aiq/cli/commands/registry/search.py +155 -0
- aiq/cli/commands/sizing/__init__.py +14 -0
- aiq/cli/commands/sizing/calc.py +297 -0
- aiq/cli/commands/sizing/sizing.py +27 -0
- aiq/cli/commands/start.py +246 -0
- aiq/cli/commands/uninstall.py +81 -0
- aiq/cli/commands/validate.py +47 -0
- aiq/cli/commands/workflow/__init__.py +14 -0
- aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
- aiq/cli/commands/workflow/templates/config.yml.j2 +16 -0
- aiq/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
- aiq/cli/commands/workflow/templates/register.py.j2 +5 -0
- aiq/cli/commands/workflow/templates/workflow.py.j2 +36 -0
- aiq/cli/commands/workflow/workflow.py +37 -0
- aiq/cli/commands/workflow/workflow_commands.py +313 -0
- aiq/cli/entrypoint.py +135 -0
- aiq/cli/main.py +44 -0
- aiq/cli/register_workflow.py +488 -0
- aiq/cli/type_registry.py +1000 -0
- aiq/data_models/__init__.py +14 -0
- aiq/data_models/api_server.py +694 -0
- aiq/data_models/authentication.py +231 -0
- aiq/data_models/common.py +171 -0
- aiq/data_models/component.py +54 -0
- aiq/data_models/component_ref.py +168 -0
- aiq/data_models/config.py +406 -0
- aiq/data_models/dataset_handler.py +123 -0
- aiq/data_models/discovery_metadata.py +335 -0
- aiq/data_models/embedder.py +27 -0
- aiq/data_models/evaluate.py +127 -0
- aiq/data_models/evaluator.py +26 -0
- aiq/data_models/front_end.py +26 -0
- aiq/data_models/function.py +30 -0
- aiq/data_models/function_dependencies.py +72 -0
- aiq/data_models/interactive.py +246 -0
- aiq/data_models/intermediate_step.py +302 -0
- aiq/data_models/invocation_node.py +38 -0
- aiq/data_models/llm.py +27 -0
- aiq/data_models/logging.py +26 -0
- aiq/data_models/memory.py +27 -0
- aiq/data_models/object_store.py +44 -0
- aiq/data_models/profiler.py +54 -0
- aiq/data_models/registry_handler.py +26 -0
- aiq/data_models/retriever.py +30 -0
- aiq/data_models/retry_mixin.py +35 -0
- aiq/data_models/span.py +187 -0
- aiq/data_models/step_adaptor.py +64 -0
- aiq/data_models/streaming.py +33 -0
- aiq/data_models/swe_bench_model.py +54 -0
- aiq/data_models/telemetry_exporter.py +26 -0
- aiq/data_models/ttc_strategy.py +30 -0
- aiq/embedder/__init__.py +0 -0
- aiq/embedder/langchain_client.py +41 -0
- aiq/embedder/nim_embedder.py +59 -0
- aiq/embedder/openai_embedder.py +43 -0
- aiq/embedder/register.py +24 -0
- aiq/eval/__init__.py +14 -0
- aiq/eval/config.py +60 -0
- aiq/eval/dataset_handler/__init__.py +0 -0
- aiq/eval/dataset_handler/dataset_downloader.py +106 -0
- aiq/eval/dataset_handler/dataset_filter.py +52 -0
- aiq/eval/dataset_handler/dataset_handler.py +254 -0
- aiq/eval/evaluate.py +506 -0
- aiq/eval/evaluator/__init__.py +14 -0
- aiq/eval/evaluator/base_evaluator.py +73 -0
- aiq/eval/evaluator/evaluator_model.py +45 -0
- aiq/eval/intermediate_step_adapter.py +99 -0
- aiq/eval/rag_evaluator/__init__.py +0 -0
- aiq/eval/rag_evaluator/evaluate.py +178 -0
- aiq/eval/rag_evaluator/register.py +143 -0
- aiq/eval/register.py +23 -0
- aiq/eval/remote_workflow.py +133 -0
- aiq/eval/runners/__init__.py +14 -0
- aiq/eval/runners/config.py +39 -0
- aiq/eval/runners/multi_eval_runner.py +54 -0
- aiq/eval/runtime_event_subscriber.py +52 -0
- aiq/eval/swe_bench_evaluator/__init__.py +0 -0
- aiq/eval/swe_bench_evaluator/evaluate.py +215 -0
- aiq/eval/swe_bench_evaluator/register.py +36 -0
- aiq/eval/trajectory_evaluator/__init__.py +0 -0
- aiq/eval/trajectory_evaluator/evaluate.py +75 -0
- aiq/eval/trajectory_evaluator/register.py +40 -0
- aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
- aiq/eval/tunable_rag_evaluator/evaluate.py +245 -0
- aiq/eval/tunable_rag_evaluator/register.py +52 -0
- aiq/eval/usage_stats.py +41 -0
- aiq/eval/utils/__init__.py +0 -0
- aiq/eval/utils/output_uploader.py +140 -0
- aiq/eval/utils/tqdm_position_registry.py +40 -0
- aiq/eval/utils/weave_eval.py +184 -0
- aiq/experimental/__init__.py +0 -0
- aiq/experimental/decorators/__init__.py +0 -0
- aiq/experimental/decorators/experimental_warning_decorator.py +130 -0
- aiq/experimental/test_time_compute/__init__.py +0 -0
- aiq/experimental/test_time_compute/editing/__init__.py +0 -0
- aiq/experimental/test_time_compute/editing/iterative_plan_refinement_editor.py +147 -0
- aiq/experimental/test_time_compute/editing/llm_as_a_judge_editor.py +204 -0
- aiq/experimental/test_time_compute/editing/motivation_aware_summarization.py +107 -0
- aiq/experimental/test_time_compute/functions/__init__.py +0 -0
- aiq/experimental/test_time_compute/functions/execute_score_select_function.py +105 -0
- aiq/experimental/test_time_compute/functions/its_tool_orchestration_function.py +205 -0
- aiq/experimental/test_time_compute/functions/its_tool_wrapper_function.py +146 -0
- aiq/experimental/test_time_compute/functions/plan_select_execute_function.py +224 -0
- aiq/experimental/test_time_compute/models/__init__.py +0 -0
- aiq/experimental/test_time_compute/models/editor_config.py +132 -0
- aiq/experimental/test_time_compute/models/scoring_config.py +112 -0
- aiq/experimental/test_time_compute/models/search_config.py +120 -0
- aiq/experimental/test_time_compute/models/selection_config.py +154 -0
- aiq/experimental/test_time_compute/models/stage_enums.py +43 -0
- aiq/experimental/test_time_compute/models/strategy_base.py +66 -0
- aiq/experimental/test_time_compute/models/tool_use_config.py +41 -0
- aiq/experimental/test_time_compute/models/ttc_item.py +48 -0
- aiq/experimental/test_time_compute/register.py +36 -0
- aiq/experimental/test_time_compute/scoring/__init__.py +0 -0
- aiq/experimental/test_time_compute/scoring/llm_based_agent_scorer.py +168 -0
- aiq/experimental/test_time_compute/scoring/llm_based_plan_scorer.py +168 -0
- aiq/experimental/test_time_compute/scoring/motivation_aware_scorer.py +111 -0
- aiq/experimental/test_time_compute/search/__init__.py +0 -0
- aiq/experimental/test_time_compute/search/multi_llm_planner.py +128 -0
- aiq/experimental/test_time_compute/search/multi_query_retrieval_search.py +122 -0
- aiq/experimental/test_time_compute/search/single_shot_multi_plan_planner.py +128 -0
- aiq/experimental/test_time_compute/selection/__init__.py +0 -0
- aiq/experimental/test_time_compute/selection/best_of_n_selector.py +63 -0
- aiq/experimental/test_time_compute/selection/llm_based_agent_output_selector.py +131 -0
- aiq/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +159 -0
- aiq/experimental/test_time_compute/selection/llm_based_plan_selector.py +128 -0
- aiq/experimental/test_time_compute/selection/threshold_selector.py +58 -0
- aiq/front_ends/__init__.py +14 -0
- aiq/front_ends/console/__init__.py +14 -0
- aiq/front_ends/console/authentication_flow_handler.py +233 -0
- aiq/front_ends/console/console_front_end_config.py +32 -0
- aiq/front_ends/console/console_front_end_plugin.py +96 -0
- aiq/front_ends/console/register.py +25 -0
- aiq/front_ends/cron/__init__.py +14 -0
- aiq/front_ends/fastapi/__init__.py +14 -0
- aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
- aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
- aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +107 -0
- aiq/front_ends/fastapi/fastapi_front_end_config.py +234 -0
- aiq/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
- aiq/front_ends/fastapi/fastapi_front_end_plugin.py +116 -0
- aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +1092 -0
- aiq/front_ends/fastapi/html_snippets/__init__.py +14 -0
- aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
- aiq/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
- aiq/front_ends/fastapi/job_store.py +183 -0
- aiq/front_ends/fastapi/main.py +72 -0
- aiq/front_ends/fastapi/message_handler.py +298 -0
- aiq/front_ends/fastapi/message_validator.py +345 -0
- aiq/front_ends/fastapi/register.py +25 -0
- aiq/front_ends/fastapi/response_helpers.py +195 -0
- aiq/front_ends/fastapi/step_adaptor.py +321 -0
- aiq/front_ends/mcp/__init__.py +14 -0
- aiq/front_ends/mcp/mcp_front_end_config.py +32 -0
- aiq/front_ends/mcp/mcp_front_end_plugin.py +93 -0
- aiq/front_ends/mcp/register.py +27 -0
- aiq/front_ends/mcp/tool_converter.py +242 -0
- aiq/front_ends/register.py +22 -0
- aiq/front_ends/simple_base/__init__.py +14 -0
- aiq/front_ends/simple_base/simple_front_end_plugin_base.py +54 -0
- aiq/llm/__init__.py +0 -0
- aiq/llm/aws_bedrock_llm.py +57 -0
- aiq/llm/nim_llm.py +46 -0
- aiq/llm/openai_llm.py +46 -0
- aiq/llm/register.py +23 -0
- aiq/llm/utils/__init__.py +14 -0
- aiq/llm/utils/env_config_value.py +94 -0
- aiq/llm/utils/error.py +17 -0
- aiq/memory/__init__.py +20 -0
- aiq/memory/interfaces.py +183 -0
- aiq/memory/models.py +112 -0
- aiq/meta/module_to_distro.json +3 -0
- aiq/meta/pypi.md +58 -0
- aiq/object_store/__init__.py +20 -0
- aiq/object_store/in_memory_object_store.py +76 -0
- aiq/object_store/interfaces.py +84 -0
- aiq/object_store/models.py +36 -0
- aiq/object_store/register.py +20 -0
- aiq/observability/__init__.py +14 -0
- aiq/observability/exporter/__init__.py +14 -0
- aiq/observability/exporter/base_exporter.py +449 -0
- aiq/observability/exporter/exporter.py +78 -0
- aiq/observability/exporter/file_exporter.py +33 -0
- aiq/observability/exporter/processing_exporter.py +322 -0
- aiq/observability/exporter/raw_exporter.py +52 -0
- aiq/observability/exporter/span_exporter.py +265 -0
- aiq/observability/exporter_manager.py +335 -0
- aiq/observability/mixin/__init__.py +14 -0
- aiq/observability/mixin/batch_config_mixin.py +26 -0
- aiq/observability/mixin/collector_config_mixin.py +23 -0
- aiq/observability/mixin/file_mixin.py +288 -0
- aiq/observability/mixin/file_mode.py +23 -0
- aiq/observability/mixin/resource_conflict_mixin.py +134 -0
- aiq/observability/mixin/serialize_mixin.py +61 -0
- aiq/observability/mixin/type_introspection_mixin.py +183 -0
- aiq/observability/processor/__init__.py +14 -0
- aiq/observability/processor/batching_processor.py +310 -0
- aiq/observability/processor/callback_processor.py +42 -0
- aiq/observability/processor/intermediate_step_serializer.py +28 -0
- aiq/observability/processor/processor.py +71 -0
- aiq/observability/register.py +96 -0
- aiq/observability/utils/__init__.py +14 -0
- aiq/observability/utils/dict_utils.py +236 -0
- aiq/observability/utils/time_utils.py +31 -0
- aiq/plugins/.namespace +1 -0
- aiq/profiler/__init__.py +0 -0
- aiq/profiler/calc/__init__.py +14 -0
- aiq/profiler/calc/calc_runner.py +627 -0
- aiq/profiler/calc/calculations.py +288 -0
- aiq/profiler/calc/data_models.py +188 -0
- aiq/profiler/calc/plot.py +345 -0
- aiq/profiler/callbacks/__init__.py +0 -0
- aiq/profiler/callbacks/agno_callback_handler.py +295 -0
- aiq/profiler/callbacks/base_callback_class.py +20 -0
- aiq/profiler/callbacks/langchain_callback_handler.py +290 -0
- aiq/profiler/callbacks/llama_index_callback_handler.py +205 -0
- aiq/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
- aiq/profiler/callbacks/token_usage_base_model.py +27 -0
- aiq/profiler/data_frame_row.py +51 -0
- aiq/profiler/data_models.py +24 -0
- aiq/profiler/decorators/__init__.py +0 -0
- aiq/profiler/decorators/framework_wrapper.py +131 -0
- aiq/profiler/decorators/function_tracking.py +254 -0
- aiq/profiler/forecasting/__init__.py +0 -0
- aiq/profiler/forecasting/config.py +18 -0
- aiq/profiler/forecasting/model_trainer.py +75 -0
- aiq/profiler/forecasting/models/__init__.py +22 -0
- aiq/profiler/forecasting/models/forecasting_base_model.py +40 -0
- aiq/profiler/forecasting/models/linear_model.py +196 -0
- aiq/profiler/forecasting/models/random_forest_regressor.py +268 -0
- aiq/profiler/inference_metrics_model.py +28 -0
- aiq/profiler/inference_optimization/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +460 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
- aiq/profiler/inference_optimization/data_models.py +386 -0
- aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
- aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
- aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
- aiq/profiler/inference_optimization/llm_metrics.py +212 -0
- aiq/profiler/inference_optimization/prompt_caching.py +163 -0
- aiq/profiler/inference_optimization/token_uniqueness.py +107 -0
- aiq/profiler/inference_optimization/workflow_runtimes.py +72 -0
- aiq/profiler/intermediate_property_adapter.py +102 -0
- aiq/profiler/profile_runner.py +473 -0
- aiq/profiler/utils.py +184 -0
- aiq/registry_handlers/__init__.py +0 -0
- aiq/registry_handlers/local/__init__.py +0 -0
- aiq/registry_handlers/local/local_handler.py +176 -0
- aiq/registry_handlers/local/register_local.py +37 -0
- aiq/registry_handlers/metadata_factory.py +60 -0
- aiq/registry_handlers/package_utils.py +567 -0
- aiq/registry_handlers/pypi/__init__.py +0 -0
- aiq/registry_handlers/pypi/pypi_handler.py +251 -0
- aiq/registry_handlers/pypi/register_pypi.py +40 -0
- aiq/registry_handlers/register.py +21 -0
- aiq/registry_handlers/registry_handler_base.py +157 -0
- aiq/registry_handlers/rest/__init__.py +0 -0
- aiq/registry_handlers/rest/register_rest.py +56 -0
- aiq/registry_handlers/rest/rest_handler.py +237 -0
- aiq/registry_handlers/schemas/__init__.py +0 -0
- aiq/registry_handlers/schemas/headers.py +42 -0
- aiq/registry_handlers/schemas/package.py +68 -0
- aiq/registry_handlers/schemas/publish.py +63 -0
- aiq/registry_handlers/schemas/pull.py +82 -0
- aiq/registry_handlers/schemas/remove.py +36 -0
- aiq/registry_handlers/schemas/search.py +91 -0
- aiq/registry_handlers/schemas/status.py +47 -0
- aiq/retriever/__init__.py +0 -0
- aiq/retriever/interface.py +37 -0
- aiq/retriever/milvus/__init__.py +14 -0
- aiq/retriever/milvus/register.py +81 -0
- aiq/retriever/milvus/retriever.py +228 -0
- aiq/retriever/models.py +74 -0
- aiq/retriever/nemo_retriever/__init__.py +14 -0
- aiq/retriever/nemo_retriever/register.py +60 -0
- aiq/retriever/nemo_retriever/retriever.py +190 -0
- aiq/retriever/register.py +22 -0
- aiq/runtime/__init__.py +14 -0
- aiq/runtime/loader.py +215 -0
- aiq/runtime/runner.py +190 -0
- aiq/runtime/session.py +158 -0
- aiq/runtime/user_metadata.py +130 -0
- aiq/settings/__init__.py +0 -0
- aiq/settings/global_settings.py +318 -0
- aiq/test/.namespace +1 -0
- aiq/tool/__init__.py +0 -0
- aiq/tool/chat_completion.py +74 -0
- aiq/tool/code_execution/README.md +151 -0
- aiq/tool/code_execution/__init__.py +0 -0
- aiq/tool/code_execution/code_sandbox.py +267 -0
- aiq/tool/code_execution/local_sandbox/.gitignore +1 -0
- aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
- aiq/tool/code_execution/local_sandbox/__init__.py +13 -0
- aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +198 -0
- aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +6 -0
- aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +50 -0
- aiq/tool/code_execution/register.py +74 -0
- aiq/tool/code_execution/test_code_execution_sandbox.py +414 -0
- aiq/tool/code_execution/utils.py +100 -0
- aiq/tool/datetime_tools.py +42 -0
- aiq/tool/document_search.py +141 -0
- aiq/tool/github_tools/__init__.py +0 -0
- aiq/tool/github_tools/create_github_commit.py +133 -0
- aiq/tool/github_tools/create_github_issue.py +87 -0
- aiq/tool/github_tools/create_github_pr.py +106 -0
- aiq/tool/github_tools/get_github_file.py +106 -0
- aiq/tool/github_tools/get_github_issue.py +166 -0
- aiq/tool/github_tools/get_github_pr.py +256 -0
- aiq/tool/github_tools/update_github_issue.py +100 -0
- aiq/tool/mcp/__init__.py +14 -0
- aiq/tool/mcp/exceptions.py +142 -0
- aiq/tool/mcp/mcp_client.py +255 -0
- aiq/tool/mcp/mcp_tool.py +96 -0
- aiq/tool/memory_tools/__init__.py +0 -0
- aiq/tool/memory_tools/add_memory_tool.py +79 -0
- aiq/tool/memory_tools/delete_memory_tool.py +67 -0
- aiq/tool/memory_tools/get_memory_tool.py +72 -0
- aiq/tool/nvidia_rag.py +95 -0
- aiq/tool/register.py +38 -0
- aiq/tool/retriever.py +89 -0
- aiq/tool/server_tools.py +66 -0
- aiq/utils/__init__.py +0 -0
- aiq/utils/data_models/__init__.py +0 -0
- aiq/utils/data_models/schema_validator.py +58 -0
- aiq/utils/debugging_utils.py +43 -0
- aiq/utils/dump_distro_mapping.py +32 -0
- aiq/utils/exception_handlers/__init__.py +0 -0
- aiq/utils/exception_handlers/automatic_retries.py +289 -0
- aiq/utils/exception_handlers/mcp.py +211 -0
- aiq/utils/exception_handlers/schemas.py +114 -0
- aiq/utils/io/__init__.py +0 -0
- aiq/utils/io/model_processing.py +28 -0
- aiq/utils/io/yaml_tools.py +119 -0
- aiq/utils/log_utils.py +37 -0
- aiq/utils/metadata_utils.py +74 -0
- aiq/utils/optional_imports.py +142 -0
- aiq/utils/producer_consumer_queue.py +178 -0
- aiq/utils/reactive/__init__.py +0 -0
- aiq/utils/reactive/base/__init__.py +0 -0
- aiq/utils/reactive/base/observable_base.py +65 -0
- aiq/utils/reactive/base/observer_base.py +55 -0
- aiq/utils/reactive/base/subject_base.py +79 -0
- aiq/utils/reactive/observable.py +59 -0
- aiq/utils/reactive/observer.py +76 -0
- aiq/utils/reactive/subject.py +131 -0
- aiq/utils/reactive/subscription.py +49 -0
- aiq/utils/settings/__init__.py +0 -0
- aiq/utils/settings/global_settings.py +197 -0
- aiq/utils/string_utils.py +38 -0
- aiq/utils/type_converter.py +290 -0
- aiq/utils/type_utils.py +484 -0
- aiq/utils/url_utils.py +27 -0
- nvidia_nat-1.2.0rc5.dist-info/METADATA +363 -0
- nvidia_nat-1.2.0rc5.dist-info/RECORD +435 -0
- nvidia_nat-1.2.0rc5.dist-info/WHEEL +5 -0
- nvidia_nat-1.2.0rc5.dist-info/entry_points.txt +20 -0
- nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE-3rd-party.txt +3686 -0
- nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE.md +201 -0
- nvidia_nat-1.2.0rc5.dist-info/top_level.txt +1 -0
|
@@ -0,0 +1,63 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
|
|
18
|
+
from aiq.builder.builder import Builder
|
|
19
|
+
from aiq.cli.register_workflow import register_ttc_strategy
|
|
20
|
+
from aiq.experimental.test_time_compute.models.selection_config import BestOfNSelectionConfig
|
|
21
|
+
from aiq.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
22
|
+
from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
23
|
+
from aiq.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
24
|
+
from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
25
|
+
|
|
26
|
+
logger = logging.getLogger(__name__)
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
class BestOfNSelector(StrategyBase):
    """
    Selection strategy that keeps only the single highest-scoring item.

    Every item passed to `ainvoke` must already carry a non-None `score`.
    """

    async def build_components(self, builder: Builder) -> None:
        """
        Build the components required for the selector.

        This selector needs nothing from the builder, so this is a no-op.
        """
        pass

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """
        Return the pipeline types this selector declares support for.
        """
        return [PipelineTypeEnum.PLANNING, PipelineTypeEnum.AGENT_EXECUTION, PipelineTypeEnum.TOOL_USE]

    def stage_type(self) -> StageTypeEnum:
        """
        Return the stage this strategy belongs to (selection).
        """
        return StageTypeEnum.SELECTION

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Pick the item with the highest score.

        Args:
            items (list[TTCItem]): The scored items to select from.
            original_prompt (str | None): Accepted for interface compatibility; not used here.
            agent_context (str | None): Accepted for interface compatibility; not used here.

        Returns:
            list[TTCItem]: A one-element list holding the highest-scoring item. On ties, the first
            such item in `items` wins.

        Raises:
            ValueError: If `items` is empty or any item has a score of None.
        """
        # Fail with a clear message instead of the opaque "max() arg is an empty sequence".
        if not items:
            raise ValueError("No items were provided to select from.")

        # Every item needs a score, otherwise the comparison below is meaningless
        if any(item.score is None for item in items):
            raise ValueError("Every planning item must have a score. Did you use a scorer before this?")

        # Pick the item with the highest score
        best_item = max(items, key=lambda item: item.score)

        return [best_item]
|
|
55
|
+
|
|
56
|
+
|
|
57
|
+
@register_ttc_strategy(config_type=BestOfNSelectionConfig)
async def register_best_of_n_selector(config: BestOfNSelectionConfig, builder: Builder):
    """
    Create a BestOfNSelector from the given config and yield it.

    The `builder` argument is accepted but not used by this strategy.
    """
    yield BestOfNSelector(config)
|
|
@@ -0,0 +1,131 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
import re
|
|
18
|
+
|
|
19
|
+
from aiq.builder.builder import Builder
|
|
20
|
+
from aiq.builder.framework_enum import LLMFrameworkEnum
|
|
21
|
+
from aiq.cli.register_workflow import register_ttc_strategy
|
|
22
|
+
from aiq.data_models.ttc_strategy import TTCStrategyBaseConfig
|
|
23
|
+
from aiq.experimental.test_time_compute.models.selection_config import LLMBasedAgentOutputSelectionConfig
|
|
24
|
+
from aiq.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
25
|
+
from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
26
|
+
from aiq.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
27
|
+
from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
28
|
+
from aiq.utils.io.model_processing import remove_r1_think_tags
|
|
29
|
+
|
|
30
|
+
logger = logging.getLogger(__name__)
|
|
31
|
+
|
|
32
|
+
|
|
33
|
+
class LLMBasedAgentOutputSelector(StrategyBase):
    """
    Selection strategy that asks an LLM to choose one of several candidate outputs.

    The candidates are numbered starting at 1 and rendered into the configured selection template.
    The LLM reply is expected to start with `SELECTED ITEM: <number>`.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        super().__init__(config)
        # Set by build_components(); ainvoke() refuses to run until this is a BaseChatModel.
        self.llm_bound = None

    async def build_components(self, builder: Builder) -> None:
        """
        Build the components required for the selector.

        Fetches the LLM referenced by `config.selection_llm` from the builder, requesting the
        LANGCHAIN wrapper type.
        """
        self.llm_bound = await builder.get_llm(self.config.selection_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """
        Return the pipeline types this selector declares support for.
        """
        return [PipelineTypeEnum.AGENT_EXECUTION]

    def stage_type(self) -> StageTypeEnum:
        """
        Return the stage this strategy belongs to (selection).
        """
        return StageTypeEnum.SELECTION

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Select one item by asking the selection LLM to choose among the candidate outputs.

        Args:
            items (list[TTCItem]): The list of items to select from.
            original_prompt (str | None): The prompt the user provided the agent.
            agent_context (str | None): The context of the agent, if applicable.

        Returns:
            list[TTCItem]: A one-element list containing the selected item.

        Raises:
            ImportError: If langchain-core is not installed.
            ValueError: If the LLM is not a `BaseChatModel`, `items` is empty, the LLM response does
                not match the expected format, or the selected index is out of range.
        """

        try:
            from langchain_core.language_models import BaseChatModel
            from langchain_core.prompts import PromptTemplate
        except ImportError as e:
            raise ImportError("langchain-core is not installed. Please install it to use "
                              "LLMBasedAgentOutputSelector.\n"
                              "This error can be resolved by installing aiqtoolkit-langchain.") from e

        from pydantic import BaseModel

        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("The `selection_llm` must be an instance of `BaseChatModel`.")

        # With no candidates every possible answer is out of range, so fail before calling the LLM.
        if not items:
            raise ValueError("No items were provided to select from.")

        model: BaseChatModel = self.llm_bound

        # Render the candidates as a 1-based numbered list; the LLM answers with one of these numbers.
        numbered_outputs = []
        for number, item in enumerate(items, start=1):
            item_str = str(item.output.model_dump()) if isinstance(item.output, BaseModel) else str(item.output)
            numbered_outputs.append(f"{number}. {remove_r1_think_tags(item_str)}\n\n")
        results = "".join(numbered_outputs)

        prompt_template = PromptTemplate(
            template=self.config.selection_template,
            input_variables=["objective", "input", "results"],
            validate_template=True,
        )

        prompt = (await prompt_template.ainvoke(input={
            "objective": agent_context, "input": original_prompt, "results": results
        })).to_string()

        selected_plan_index = remove_r1_think_tags((await model.ainvoke(prompt)).content)

        # The model response is expected to start with 'SELECTED ITEM: {item number}'.
        # Use a regex to extract the item number from the response string.
        if not isinstance(selected_plan_index, str):
            logger.warning("Invalid response from LLM for selected plan index: %s.", selected_plan_index)
            raise ValueError("Unable to parse the selected plan index.")
        selected_plan_index = selected_plan_index.strip()
        match = re.match(r'^\s*SELECTED ITEM:\s+(\d+)', selected_plan_index)
        if not match:
            logger.warning("Could not parse the selected plan index from the response: %s.", selected_plan_index)
            raise ValueError("The response format for selecting the item is incorrect.")
        index = match.group(1)

        try:
            # The LLM sees 1-based numbering; convert to a 0-based list index.
            selected_index = int(index) - 1
            if not 0 <= selected_index < len(items):
                raise ValueError("Selected index is out of range.")
        except ValueError as e:
            logger.warning("Error parsing the selected plan index: %s. Exception: %s", index, e)
            raise ValueError(f"Failed to parse the selected plan index from the LLM response: {selected_plan_index}. "
                             "Ensure the response follows the expected format.") from e

        # Return the selected item
        return [items[selected_index]]
|
|
122
|
+
|
|
123
|
+
|
|
124
|
+
@register_ttc_strategy(config_type=LLMBasedAgentOutputSelectionConfig)
async def register_llm_based_agent_output_selector(config: LLMBasedAgentOutputSelectionConfig, builder: Builder):
    """
    Create an LLMBasedAgentOutputSelector, build its components, and yield it.
    """
    strategy = LLMBasedAgentOutputSelector(config)
    # The selector's LLM is resolved from the builder before the strategy is handed out.
    await strategy.build_components(builder)
    yield strategy
|
|
@@ -0,0 +1,159 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
|
|
18
|
+
from aiq.builder.builder import Builder
|
|
19
|
+
from aiq.builder.framework_enum import LLMFrameworkEnum
|
|
20
|
+
from aiq.cli.register_workflow import register_ttc_strategy
|
|
21
|
+
from aiq.data_models.ttc_strategy import TTCStrategyBaseConfig
|
|
22
|
+
from aiq.experimental.test_time_compute.models.selection_config import LLMBasedOutputMergingConfig
|
|
23
|
+
from aiq.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
24
|
+
from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
25
|
+
from aiq.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
26
|
+
from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
27
|
+
from aiq.utils.io.model_processing import remove_r1_think_tags
|
|
28
|
+
|
|
29
|
+
logger = logging.getLogger(__name__)
|
|
30
|
+
|
|
31
|
+
|
|
32
|
+
class LLMBasedOutputMergingSelector(StrategyBase):
    """
    Selection-stage strategy that asks an LLM to merge several candidate plans
    or agent outputs into a single item.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        super().__init__(config)
        # Set by build_components(); ainvoke() rejects the call while this is not a chat model.
        self.llm_bound = None

    async def build_components(self, builder: Builder) -> None:
        """
        Build the components required for the selector.

        Fetches the LLM referenced by ``config.selection_llm`` from ``builder`` using the LangChain wrapper.
        """
        self.llm_bound = await builder.get_llm(self.config.selection_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types this strategy can be used in."""
        return [PipelineTypeEnum.AGENT_EXECUTION, PipelineTypeEnum.PLANNING]

    def stage_type(self) -> StageTypeEnum:
        """Return the stage this strategy belongs to (selection)."""
        return StageTypeEnum.SELECTION

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Merge the plans or outputs of multiple items into a single item.

        Args:
            items (list[TTCItem]): The candidate items to merge. Must not be empty.
            original_prompt (str): The prompt the user provided the agent.
            agent_context (str): The context of the agent, if applicable.
            **kwargs: May contain ``output_parser``, a callable applied to the merged text
                before it is stored on the returned item.

        Returns:
            list[TTCItem]: A single-element list holding the merged item. Its ``input`` is
            copied from the first entry of ``items``.

        Raises:
            ImportError: If langchain-core is not installed.
            RuntimeError: If the pipeline type has not been set.
            ValueError: If the LLM is not a ``BaseChatModel``, ``items`` is empty, the LLM
                response is not a string or lacks the 'MERGED OUTPUT:' marker, or the
                ``output_parser`` fails.
        """

        try:
            from langchain_core.language_models import BaseChatModel
            from langchain_core.prompts import PromptTemplate
        except ImportError as e:
            raise ImportError(
                "langchain-core is not installed. Please install it to use LLMBasedOutputMergingSelector.\n"
                "This error can be resolved by installing aiqtoolkit-langchain.") from e

        from typing import Callable

        from pydantic import BaseModel

        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("The `selection_llm` must be an instance of `BaseChatModel`.")

        if not self.pipeline_type:
            raise RuntimeError("Pipeline type is not set. Ensure that the pipeline "
                               "type is set before invoking the selector.")

        # Fail before spending an LLM call; the merged item needs items[0].input below.
        if not items:
            raise ValueError("No items were provided to merge.")

        model: BaseChatModel = self.llm_bound

        # Render the candidates as a numbered list (1-based) for the prompt.
        use_outputs = self.pipeline_type == PipelineTypeEnum.AGENT_EXECUTION
        numbered: list[str] = []
        for position, item in enumerate(items, start=1):
            if use_outputs:
                # Pydantic outputs are dumped to a dict first so the text shows field values.
                item_str = str(item.output.model_dump()) if isinstance(item.output, BaseModel) else str(item.output)
            else:
                item_str = str(item.plan)
            numbered.append(f"{position}. {remove_r1_think_tags(item_str)}\n\n")
        results = "".join(numbered)

        prompt_template = PromptTemplate(
            template=self.config.selection_template,
            input_variables=["pipeline_type", "objective", "input", "results"],
            validate_template=True,
        )

        if self.pipeline_type == PipelineTypeEnum.PLANNING:
            pipeline_objective = "execution plans for a given objective and input."
        else:
            pipeline_objective = "outputs from an agent system based on the provided objective and input."

        prompt = (await prompt_template.ainvoke(
            input={
                "objective": agent_context,
                "input": original_prompt,
                "results": results,
                "pipeline_type": pipeline_objective
            })).to_string()

        merged_output = remove_r1_think_tags((await model.ainvoke(prompt)).content)

        if not isinstance(merged_output, str):
            logger.warning(f"Invalid response from LLM for merged_plan: {merged_output}.")
            raise ValueError("Unable to parse merged plan.")
        merged_output = merged_output.strip()

        # Keep only the text after the last 'MERGED OUTPUT:' marker.
        matches = merged_output.split("MERGED OUTPUT:")
        if len(matches) > 1:
            merged_output = matches[-1].strip()
        else:
            raise ValueError("Merged output does not contain 'MERGED OUTPUT:' prefix.")

        # Apply the optional caller-supplied parser passed as the `output_parser` keyword argument.
        output_parser: Callable | None = kwargs.get('output_parser', None)
        if output_parser:
            try:
                merged_output = output_parser(merged_output)
            except Exception as e:
                logger.error(f"Error parsing merged output: {e}")
                raise ValueError("Failed to parse merged output.") from e

        logger.info("Merged output: %s", str(merged_output))

        # Create a new TTCItem with the merged plan or output
        if self.pipeline_type == PipelineTypeEnum.PLANNING:
            merged_item = TTCItem(input=items[0].input, output=merged_output, plan=merged_output)
        else:
            merged_item = TTCItem(input=items[0].input, output=merged_output)

        return [merged_item]
|
|
150
|
+
|
|
151
|
+
|
|
152
|
+
@register_ttc_strategy(config_type=LLMBasedOutputMergingConfig)
async def register_llm_based_output_merging_selector(config: LLMBasedOutputMergingConfig, builder: Builder):
    """
    Create an LLMBasedOutputMergingSelector for ``config`` and yield it.

    The selector's components are built with ``builder`` before it is yielded.
    """
    strategy = LLMBasedOutputMergingSelector(config)
    # Build first so the yielded strategy already has its LLM bound.
    await strategy.build_components(builder)
    yield strategy
|
|
@@ -0,0 +1,128 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
import re
|
|
18
|
+
|
|
19
|
+
from aiq.builder.builder import Builder
|
|
20
|
+
from aiq.builder.framework_enum import LLMFrameworkEnum
|
|
21
|
+
from aiq.cli.register_workflow import register_ttc_strategy
|
|
22
|
+
from aiq.data_models.ttc_strategy import TTCStrategyBaseConfig
|
|
23
|
+
from aiq.experimental.test_time_compute.models.selection_config import LLMBasedPlanSelectionConfig
|
|
24
|
+
from aiq.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
25
|
+
from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
26
|
+
from aiq.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
27
|
+
from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
28
|
+
from aiq.utils.io.model_processing import remove_r1_think_tags
|
|
29
|
+
|
|
30
|
+
logger = logging.getLogger(__name__)
|
|
31
|
+
|
|
32
|
+
|
|
33
|
+
class LLMBasedPlanSelector(StrategyBase):
    """
    Selection-stage strategy that asks an LLM to pick one plan out of several
    candidate planning items.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        super().__init__(config)
        # Set by build_components(); ainvoke() rejects the call while this is not a chat model.
        self.llm_bound = None

    async def build_components(self, builder: Builder) -> None:
        """
        Build the components required for the selector.

        Fetches the LLM referenced by ``config.selection_llm`` from ``builder`` using the LangChain wrapper.
        """
        self.llm_bound = await builder.get_llm(self.config.selection_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types this strategy can be used in."""
        return [PipelineTypeEnum.PLANNING]

    def stage_type(self) -> StageTypeEnum:
        """Return the stage this strategy belongs to (selection)."""
        return StageTypeEnum.SELECTION

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Select one planning item by asking the LLM which plan is best.

        Args:
            items (list[TTCItem]): The list of planning items to select from.
            original_prompt (str): The prompt the user provided the agent.
            agent_context (str): The context of the agent, if applicable.
            **kwargs: Accepted but not used by this strategy.

        Returns:
            list[TTCItem]: A single-element list holding the selected planning item.

        Raises:
            ImportError: If langchain-core is not installed.
            ValueError: If the LLM is not a ``BaseChatModel``, the response is not a string,
                the response does not start with 'SELECTED PLAN: <number>', or the number
                is outside the range of ``items``.
        """

        try:
            from langchain_core.language_models import BaseChatModel
            from langchain_core.prompts import PromptTemplate
        except ImportError as e:
            raise ImportError("langchain-core is not installed. Please install it to use LLMBasedPlanSelector.\n"
                              "This error can be resolved by installing aiqtoolkit-langchain.") from e

        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("The `selection_llm` must be an instance of `BaseChatModel`.")

        model: BaseChatModel = self.llm_bound

        # Render the candidate plans as a numbered list (1-based) for the prompt.
        plans = "".join(f"{position}. {remove_r1_think_tags(item.plan)}\n"
                        for position, item in enumerate(items, start=1))

        prompt_template = PromptTemplate(
            template=self.config.selection_template,
            input_variables=["original_prompt", "context", "plans"],
            validate_template=True,
        )

        prompt = (await prompt_template.ainvoke(input={
            "original_prompt": original_prompt, "context": agent_context, "plans": plans
        })).to_string()

        selected_plan_index = remove_r1_think_tags((await model.ainvoke(prompt)).content)

        # The response is expected to start with 'SELECTED PLAN: <plan number>';
        # the plan number is extracted with a regex below.
        if not isinstance(selected_plan_index, str):
            logger.warning(f"Invalid response from LLM for selected plan index: {selected_plan_index}.")
            raise ValueError("Unable to parse the selected plan index.")
        selected_plan_index = selected_plan_index.strip()
        match = re.match(r'^\s*SELECTED PLAN:\s+(\d+)', selected_plan_index)
        if not match:
            logger.warning(f"Could not parse the selected plan index from the response: {selected_plan_index}.")
            raise ValueError("The response format for selecting the plan is incorrect.")
        index = match.group(1)

        try:
            # Plans are numbered from 1 in the prompt; convert to a 0-based list index.
            selected_index = int(index) - 1
            if selected_index < 0 or selected_index >= len(items):
                raise ValueError("Selected index is out of range.")

            # Return the selected planning item
            return [items[selected_index]]
        except ValueError as e:
            # Also catches the out-of-range error raised just above, so both failure modes
            # surface to the caller with the same message and the original cause chained.
            logger.warning(f"Error parsing the selected plan index: {index}. Exception: {str(e)}")
            raise ValueError(f"Failed to parse the selected plan index from the LLM response: {selected_plan_index}. "
                             "Ensure the response follows the expected format.") from e
|
|
119
|
+
|
|
120
|
+
|
|
121
|
+
@register_ttc_strategy(config_type=LLMBasedPlanSelectionConfig)
async def register_llm_based_plan_selection(config: LLMBasedPlanSelectionConfig, builder: Builder):
    """
    Register the LLMBasedPlanSelector with the provided configuration.

    The selector's components are built with the ``builder`` passed to this function
    before the selector is yielded.
    """
    selector = LLMBasedPlanSelector(config)
    # Use the builder supplied by the caller; constructing a fresh Builder() here would
    # ignore the workflow's builder that the selection LLM has to be fetched from.
    await selector.build_components(builder)
    yield selector
|
|
@@ -0,0 +1,58 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
|
|
18
|
+
from aiq.builder.builder import Builder
|
|
19
|
+
from aiq.cli.register_workflow import register_ttc_strategy
|
|
20
|
+
from aiq.experimental.test_time_compute.models.selection_config import ThresholdSelectionConfig
|
|
21
|
+
from aiq.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
|
|
22
|
+
from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum
|
|
23
|
+
from aiq.experimental.test_time_compute.models.strategy_base import StrategyBase
|
|
24
|
+
from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
|
|
25
|
+
|
|
26
|
+
logger = logging.getLogger(__name__)
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
class ThresholdSelector(StrategyBase):
    """
    Selection strategy that keeps a TTCItem only when its ``score`` is set and
    is greater than or equal to ``config.threshold``.
    """

    async def build_components(self, builder: Builder) -> None:
        """Nothing to build; this strategy needs no extra components."""
        return

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types this strategy can be used in."""
        return [PipelineTypeEnum.TOOL_USE]

    def stage_type(self) -> StageTypeEnum:
        """Return the stage this strategy belongs to (selection)."""
        return StageTypeEnum.SELECTION

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Filter ``items`` down to those scoring at or above the configured threshold.

        Items without a score are dropped. ``original_prompt``, ``agent_context`` and
        ``kwargs`` are accepted but not used. The input order is preserved.
        """
        cutoff = self.config.threshold
        kept: list[TTCItem] = []
        for candidate in items:
            # Unscored items cannot be compared against the cutoff.
            if candidate.score is None:
                continue
            if candidate.score >= cutoff:
                kept.append(candidate)
        logger.info("ThresholdSelector: %d items => %d items (threshold=%.1f)", len(items), len(kept), cutoff)
        return kept
|
|
53
|
+
|
|
54
|
+
|
|
55
|
+
@register_ttc_strategy(config_type=ThresholdSelectionConfig)
async def register_threshold_selector(config: ThresholdSelectionConfig, builder: Builder):
    """
    Register the ThresholdSelector with the builder.
    """
    selector = ThresholdSelector(config)
    # ThresholdSelector.build_components is currently a no-op; it is called anyway so this
    # registration follows the same build-then-yield sequence as the other selectors.
    await selector.build_components(builder)
    yield selector
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|