nvidia-nat 1.2.0rc5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (435) hide show
  1. aiq/agent/__init__.py +0 -0
  2. aiq/agent/base.py +239 -0
  3. aiq/agent/dual_node.py +67 -0
  4. aiq/agent/react_agent/__init__.py +0 -0
  5. aiq/agent/react_agent/agent.py +355 -0
  6. aiq/agent/react_agent/output_parser.py +104 -0
  7. aiq/agent/react_agent/prompt.py +41 -0
  8. aiq/agent/react_agent/register.py +149 -0
  9. aiq/agent/reasoning_agent/__init__.py +0 -0
  10. aiq/agent/reasoning_agent/reasoning_agent.py +225 -0
  11. aiq/agent/register.py +23 -0
  12. aiq/agent/rewoo_agent/__init__.py +0 -0
  13. aiq/agent/rewoo_agent/agent.py +411 -0
  14. aiq/agent/rewoo_agent/prompt.py +108 -0
  15. aiq/agent/rewoo_agent/register.py +158 -0
  16. aiq/agent/tool_calling_agent/__init__.py +0 -0
  17. aiq/agent/tool_calling_agent/agent.py +119 -0
  18. aiq/agent/tool_calling_agent/register.py +106 -0
  19. aiq/authentication/__init__.py +14 -0
  20. aiq/authentication/api_key/__init__.py +14 -0
  21. aiq/authentication/api_key/api_key_auth_provider.py +96 -0
  22. aiq/authentication/api_key/api_key_auth_provider_config.py +124 -0
  23. aiq/authentication/api_key/register.py +26 -0
  24. aiq/authentication/exceptions/__init__.py +14 -0
  25. aiq/authentication/exceptions/api_key_exceptions.py +38 -0
  26. aiq/authentication/http_basic_auth/__init__.py +0 -0
  27. aiq/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
  28. aiq/authentication/http_basic_auth/register.py +30 -0
  29. aiq/authentication/interfaces.py +93 -0
  30. aiq/authentication/oauth2/__init__.py +14 -0
  31. aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +107 -0
  32. aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
  33. aiq/authentication/oauth2/register.py +25 -0
  34. aiq/authentication/register.py +21 -0
  35. aiq/builder/__init__.py +0 -0
  36. aiq/builder/builder.py +285 -0
  37. aiq/builder/component_utils.py +316 -0
  38. aiq/builder/context.py +264 -0
  39. aiq/builder/embedder.py +24 -0
  40. aiq/builder/eval_builder.py +161 -0
  41. aiq/builder/evaluator.py +29 -0
  42. aiq/builder/framework_enum.py +24 -0
  43. aiq/builder/front_end.py +73 -0
  44. aiq/builder/function.py +344 -0
  45. aiq/builder/function_base.py +380 -0
  46. aiq/builder/function_info.py +627 -0
  47. aiq/builder/intermediate_step_manager.py +174 -0
  48. aiq/builder/llm.py +25 -0
  49. aiq/builder/retriever.py +25 -0
  50. aiq/builder/user_interaction_manager.py +74 -0
  51. aiq/builder/workflow.py +148 -0
  52. aiq/builder/workflow_builder.py +1117 -0
  53. aiq/cli/__init__.py +14 -0
  54. aiq/cli/cli_utils/__init__.py +0 -0
  55. aiq/cli/cli_utils/config_override.py +231 -0
  56. aiq/cli/cli_utils/validation.py +37 -0
  57. aiq/cli/commands/__init__.py +0 -0
  58. aiq/cli/commands/configure/__init__.py +0 -0
  59. aiq/cli/commands/configure/channel/__init__.py +0 -0
  60. aiq/cli/commands/configure/channel/add.py +28 -0
  61. aiq/cli/commands/configure/channel/channel.py +36 -0
  62. aiq/cli/commands/configure/channel/remove.py +30 -0
  63. aiq/cli/commands/configure/channel/update.py +30 -0
  64. aiq/cli/commands/configure/configure.py +33 -0
  65. aiq/cli/commands/evaluate.py +139 -0
  66. aiq/cli/commands/info/__init__.py +14 -0
  67. aiq/cli/commands/info/info.py +39 -0
  68. aiq/cli/commands/info/list_channels.py +32 -0
  69. aiq/cli/commands/info/list_components.py +129 -0
  70. aiq/cli/commands/info/list_mcp.py +213 -0
  71. aiq/cli/commands/registry/__init__.py +14 -0
  72. aiq/cli/commands/registry/publish.py +88 -0
  73. aiq/cli/commands/registry/pull.py +118 -0
  74. aiq/cli/commands/registry/registry.py +38 -0
  75. aiq/cli/commands/registry/remove.py +108 -0
  76. aiq/cli/commands/registry/search.py +155 -0
  77. aiq/cli/commands/sizing/__init__.py +14 -0
  78. aiq/cli/commands/sizing/calc.py +297 -0
  79. aiq/cli/commands/sizing/sizing.py +27 -0
  80. aiq/cli/commands/start.py +246 -0
  81. aiq/cli/commands/uninstall.py +81 -0
  82. aiq/cli/commands/validate.py +47 -0
  83. aiq/cli/commands/workflow/__init__.py +14 -0
  84. aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
  85. aiq/cli/commands/workflow/templates/config.yml.j2 +16 -0
  86. aiq/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
  87. aiq/cli/commands/workflow/templates/register.py.j2 +5 -0
  88. aiq/cli/commands/workflow/templates/workflow.py.j2 +36 -0
  89. aiq/cli/commands/workflow/workflow.py +37 -0
  90. aiq/cli/commands/workflow/workflow_commands.py +313 -0
  91. aiq/cli/entrypoint.py +135 -0
  92. aiq/cli/main.py +44 -0
  93. aiq/cli/register_workflow.py +488 -0
  94. aiq/cli/type_registry.py +1000 -0
  95. aiq/data_models/__init__.py +14 -0
  96. aiq/data_models/api_server.py +694 -0
  97. aiq/data_models/authentication.py +231 -0
  98. aiq/data_models/common.py +171 -0
  99. aiq/data_models/component.py +54 -0
  100. aiq/data_models/component_ref.py +168 -0
  101. aiq/data_models/config.py +406 -0
  102. aiq/data_models/dataset_handler.py +123 -0
  103. aiq/data_models/discovery_metadata.py +335 -0
  104. aiq/data_models/embedder.py +27 -0
  105. aiq/data_models/evaluate.py +127 -0
  106. aiq/data_models/evaluator.py +26 -0
  107. aiq/data_models/front_end.py +26 -0
  108. aiq/data_models/function.py +30 -0
  109. aiq/data_models/function_dependencies.py +72 -0
  110. aiq/data_models/interactive.py +246 -0
  111. aiq/data_models/intermediate_step.py +302 -0
  112. aiq/data_models/invocation_node.py +38 -0
  113. aiq/data_models/llm.py +27 -0
  114. aiq/data_models/logging.py +26 -0
  115. aiq/data_models/memory.py +27 -0
  116. aiq/data_models/object_store.py +44 -0
  117. aiq/data_models/profiler.py +54 -0
  118. aiq/data_models/registry_handler.py +26 -0
  119. aiq/data_models/retriever.py +30 -0
  120. aiq/data_models/retry_mixin.py +35 -0
  121. aiq/data_models/span.py +187 -0
  122. aiq/data_models/step_adaptor.py +64 -0
  123. aiq/data_models/streaming.py +33 -0
  124. aiq/data_models/swe_bench_model.py +54 -0
  125. aiq/data_models/telemetry_exporter.py +26 -0
  126. aiq/data_models/ttc_strategy.py +30 -0
  127. aiq/embedder/__init__.py +0 -0
  128. aiq/embedder/langchain_client.py +41 -0
  129. aiq/embedder/nim_embedder.py +59 -0
  130. aiq/embedder/openai_embedder.py +43 -0
  131. aiq/embedder/register.py +24 -0
  132. aiq/eval/__init__.py +14 -0
  133. aiq/eval/config.py +60 -0
  134. aiq/eval/dataset_handler/__init__.py +0 -0
  135. aiq/eval/dataset_handler/dataset_downloader.py +106 -0
  136. aiq/eval/dataset_handler/dataset_filter.py +52 -0
  137. aiq/eval/dataset_handler/dataset_handler.py +254 -0
  138. aiq/eval/evaluate.py +506 -0
  139. aiq/eval/evaluator/__init__.py +14 -0
  140. aiq/eval/evaluator/base_evaluator.py +73 -0
  141. aiq/eval/evaluator/evaluator_model.py +45 -0
  142. aiq/eval/intermediate_step_adapter.py +99 -0
  143. aiq/eval/rag_evaluator/__init__.py +0 -0
  144. aiq/eval/rag_evaluator/evaluate.py +178 -0
  145. aiq/eval/rag_evaluator/register.py +143 -0
  146. aiq/eval/register.py +23 -0
  147. aiq/eval/remote_workflow.py +133 -0
  148. aiq/eval/runners/__init__.py +14 -0
  149. aiq/eval/runners/config.py +39 -0
  150. aiq/eval/runners/multi_eval_runner.py +54 -0
  151. aiq/eval/runtime_event_subscriber.py +52 -0
  152. aiq/eval/swe_bench_evaluator/__init__.py +0 -0
  153. aiq/eval/swe_bench_evaluator/evaluate.py +215 -0
  154. aiq/eval/swe_bench_evaluator/register.py +36 -0
  155. aiq/eval/trajectory_evaluator/__init__.py +0 -0
  156. aiq/eval/trajectory_evaluator/evaluate.py +75 -0
  157. aiq/eval/trajectory_evaluator/register.py +40 -0
  158. aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
  159. aiq/eval/tunable_rag_evaluator/evaluate.py +245 -0
  160. aiq/eval/tunable_rag_evaluator/register.py +52 -0
  161. aiq/eval/usage_stats.py +41 -0
  162. aiq/eval/utils/__init__.py +0 -0
  163. aiq/eval/utils/output_uploader.py +140 -0
  164. aiq/eval/utils/tqdm_position_registry.py +40 -0
  165. aiq/eval/utils/weave_eval.py +184 -0
  166. aiq/experimental/__init__.py +0 -0
  167. aiq/experimental/decorators/__init__.py +0 -0
  168. aiq/experimental/decorators/experimental_warning_decorator.py +130 -0
  169. aiq/experimental/test_time_compute/__init__.py +0 -0
  170. aiq/experimental/test_time_compute/editing/__init__.py +0 -0
  171. aiq/experimental/test_time_compute/editing/iterative_plan_refinement_editor.py +147 -0
  172. aiq/experimental/test_time_compute/editing/llm_as_a_judge_editor.py +204 -0
  173. aiq/experimental/test_time_compute/editing/motivation_aware_summarization.py +107 -0
  174. aiq/experimental/test_time_compute/functions/__init__.py +0 -0
  175. aiq/experimental/test_time_compute/functions/execute_score_select_function.py +105 -0
  176. aiq/experimental/test_time_compute/functions/its_tool_orchestration_function.py +205 -0
  177. aiq/experimental/test_time_compute/functions/its_tool_wrapper_function.py +146 -0
  178. aiq/experimental/test_time_compute/functions/plan_select_execute_function.py +224 -0
  179. aiq/experimental/test_time_compute/models/__init__.py +0 -0
  180. aiq/experimental/test_time_compute/models/editor_config.py +132 -0
  181. aiq/experimental/test_time_compute/models/scoring_config.py +112 -0
  182. aiq/experimental/test_time_compute/models/search_config.py +120 -0
  183. aiq/experimental/test_time_compute/models/selection_config.py +154 -0
  184. aiq/experimental/test_time_compute/models/stage_enums.py +43 -0
  185. aiq/experimental/test_time_compute/models/strategy_base.py +66 -0
  186. aiq/experimental/test_time_compute/models/tool_use_config.py +41 -0
  187. aiq/experimental/test_time_compute/models/ttc_item.py +48 -0
  188. aiq/experimental/test_time_compute/register.py +36 -0
  189. aiq/experimental/test_time_compute/scoring/__init__.py +0 -0
  190. aiq/experimental/test_time_compute/scoring/llm_based_agent_scorer.py +168 -0
  191. aiq/experimental/test_time_compute/scoring/llm_based_plan_scorer.py +168 -0
  192. aiq/experimental/test_time_compute/scoring/motivation_aware_scorer.py +111 -0
  193. aiq/experimental/test_time_compute/search/__init__.py +0 -0
  194. aiq/experimental/test_time_compute/search/multi_llm_planner.py +128 -0
  195. aiq/experimental/test_time_compute/search/multi_query_retrieval_search.py +122 -0
  196. aiq/experimental/test_time_compute/search/single_shot_multi_plan_planner.py +128 -0
  197. aiq/experimental/test_time_compute/selection/__init__.py +0 -0
  198. aiq/experimental/test_time_compute/selection/best_of_n_selector.py +63 -0
  199. aiq/experimental/test_time_compute/selection/llm_based_agent_output_selector.py +131 -0
  200. aiq/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +159 -0
  201. aiq/experimental/test_time_compute/selection/llm_based_plan_selector.py +128 -0
  202. aiq/experimental/test_time_compute/selection/threshold_selector.py +58 -0
  203. aiq/front_ends/__init__.py +14 -0
  204. aiq/front_ends/console/__init__.py +14 -0
  205. aiq/front_ends/console/authentication_flow_handler.py +233 -0
  206. aiq/front_ends/console/console_front_end_config.py +32 -0
  207. aiq/front_ends/console/console_front_end_plugin.py +96 -0
  208. aiq/front_ends/console/register.py +25 -0
  209. aiq/front_ends/cron/__init__.py +14 -0
  210. aiq/front_ends/fastapi/__init__.py +14 -0
  211. aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
  212. aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
  213. aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +107 -0
  214. aiq/front_ends/fastapi/fastapi_front_end_config.py +234 -0
  215. aiq/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
  216. aiq/front_ends/fastapi/fastapi_front_end_plugin.py +116 -0
  217. aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +1092 -0
  218. aiq/front_ends/fastapi/html_snippets/__init__.py +14 -0
  219. aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
  220. aiq/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
  221. aiq/front_ends/fastapi/job_store.py +183 -0
  222. aiq/front_ends/fastapi/main.py +72 -0
  223. aiq/front_ends/fastapi/message_handler.py +298 -0
  224. aiq/front_ends/fastapi/message_validator.py +345 -0
  225. aiq/front_ends/fastapi/register.py +25 -0
  226. aiq/front_ends/fastapi/response_helpers.py +195 -0
  227. aiq/front_ends/fastapi/step_adaptor.py +321 -0
  228. aiq/front_ends/mcp/__init__.py +14 -0
  229. aiq/front_ends/mcp/mcp_front_end_config.py +32 -0
  230. aiq/front_ends/mcp/mcp_front_end_plugin.py +93 -0
  231. aiq/front_ends/mcp/register.py +27 -0
  232. aiq/front_ends/mcp/tool_converter.py +242 -0
  233. aiq/front_ends/register.py +22 -0
  234. aiq/front_ends/simple_base/__init__.py +14 -0
  235. aiq/front_ends/simple_base/simple_front_end_plugin_base.py +54 -0
  236. aiq/llm/__init__.py +0 -0
  237. aiq/llm/aws_bedrock_llm.py +57 -0
  238. aiq/llm/nim_llm.py +46 -0
  239. aiq/llm/openai_llm.py +46 -0
  240. aiq/llm/register.py +23 -0
  241. aiq/llm/utils/__init__.py +14 -0
  242. aiq/llm/utils/env_config_value.py +94 -0
  243. aiq/llm/utils/error.py +17 -0
  244. aiq/memory/__init__.py +20 -0
  245. aiq/memory/interfaces.py +183 -0
  246. aiq/memory/models.py +112 -0
  247. aiq/meta/module_to_distro.json +3 -0
  248. aiq/meta/pypi.md +58 -0
  249. aiq/object_store/__init__.py +20 -0
  250. aiq/object_store/in_memory_object_store.py +76 -0
  251. aiq/object_store/interfaces.py +84 -0
  252. aiq/object_store/models.py +36 -0
  253. aiq/object_store/register.py +20 -0
  254. aiq/observability/__init__.py +14 -0
  255. aiq/observability/exporter/__init__.py +14 -0
  256. aiq/observability/exporter/base_exporter.py +449 -0
  257. aiq/observability/exporter/exporter.py +78 -0
  258. aiq/observability/exporter/file_exporter.py +33 -0
  259. aiq/observability/exporter/processing_exporter.py +322 -0
  260. aiq/observability/exporter/raw_exporter.py +52 -0
  261. aiq/observability/exporter/span_exporter.py +265 -0
  262. aiq/observability/exporter_manager.py +335 -0
  263. aiq/observability/mixin/__init__.py +14 -0
  264. aiq/observability/mixin/batch_config_mixin.py +26 -0
  265. aiq/observability/mixin/collector_config_mixin.py +23 -0
  266. aiq/observability/mixin/file_mixin.py +288 -0
  267. aiq/observability/mixin/file_mode.py +23 -0
  268. aiq/observability/mixin/resource_conflict_mixin.py +134 -0
  269. aiq/observability/mixin/serialize_mixin.py +61 -0
  270. aiq/observability/mixin/type_introspection_mixin.py +183 -0
  271. aiq/observability/processor/__init__.py +14 -0
  272. aiq/observability/processor/batching_processor.py +310 -0
  273. aiq/observability/processor/callback_processor.py +42 -0
  274. aiq/observability/processor/intermediate_step_serializer.py +28 -0
  275. aiq/observability/processor/processor.py +71 -0
  276. aiq/observability/register.py +96 -0
  277. aiq/observability/utils/__init__.py +14 -0
  278. aiq/observability/utils/dict_utils.py +236 -0
  279. aiq/observability/utils/time_utils.py +31 -0
  280. aiq/plugins/.namespace +1 -0
  281. aiq/profiler/__init__.py +0 -0
  282. aiq/profiler/calc/__init__.py +14 -0
  283. aiq/profiler/calc/calc_runner.py +627 -0
  284. aiq/profiler/calc/calculations.py +288 -0
  285. aiq/profiler/calc/data_models.py +188 -0
  286. aiq/profiler/calc/plot.py +345 -0
  287. aiq/profiler/callbacks/__init__.py +0 -0
  288. aiq/profiler/callbacks/agno_callback_handler.py +295 -0
  289. aiq/profiler/callbacks/base_callback_class.py +20 -0
  290. aiq/profiler/callbacks/langchain_callback_handler.py +290 -0
  291. aiq/profiler/callbacks/llama_index_callback_handler.py +205 -0
  292. aiq/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
  293. aiq/profiler/callbacks/token_usage_base_model.py +27 -0
  294. aiq/profiler/data_frame_row.py +51 -0
  295. aiq/profiler/data_models.py +24 -0
  296. aiq/profiler/decorators/__init__.py +0 -0
  297. aiq/profiler/decorators/framework_wrapper.py +131 -0
  298. aiq/profiler/decorators/function_tracking.py +254 -0
  299. aiq/profiler/forecasting/__init__.py +0 -0
  300. aiq/profiler/forecasting/config.py +18 -0
  301. aiq/profiler/forecasting/model_trainer.py +75 -0
  302. aiq/profiler/forecasting/models/__init__.py +22 -0
  303. aiq/profiler/forecasting/models/forecasting_base_model.py +40 -0
  304. aiq/profiler/forecasting/models/linear_model.py +196 -0
  305. aiq/profiler/forecasting/models/random_forest_regressor.py +268 -0
  306. aiq/profiler/inference_metrics_model.py +28 -0
  307. aiq/profiler/inference_optimization/__init__.py +0 -0
  308. aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
  309. aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +460 -0
  310. aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
  311. aiq/profiler/inference_optimization/data_models.py +386 -0
  312. aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
  313. aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
  314. aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
  315. aiq/profiler/inference_optimization/llm_metrics.py +212 -0
  316. aiq/profiler/inference_optimization/prompt_caching.py +163 -0
  317. aiq/profiler/inference_optimization/token_uniqueness.py +107 -0
  318. aiq/profiler/inference_optimization/workflow_runtimes.py +72 -0
  319. aiq/profiler/intermediate_property_adapter.py +102 -0
  320. aiq/profiler/profile_runner.py +473 -0
  321. aiq/profiler/utils.py +184 -0
  322. aiq/registry_handlers/__init__.py +0 -0
  323. aiq/registry_handlers/local/__init__.py +0 -0
  324. aiq/registry_handlers/local/local_handler.py +176 -0
  325. aiq/registry_handlers/local/register_local.py +37 -0
  326. aiq/registry_handlers/metadata_factory.py +60 -0
  327. aiq/registry_handlers/package_utils.py +567 -0
  328. aiq/registry_handlers/pypi/__init__.py +0 -0
  329. aiq/registry_handlers/pypi/pypi_handler.py +251 -0
  330. aiq/registry_handlers/pypi/register_pypi.py +40 -0
  331. aiq/registry_handlers/register.py +21 -0
  332. aiq/registry_handlers/registry_handler_base.py +157 -0
  333. aiq/registry_handlers/rest/__init__.py +0 -0
  334. aiq/registry_handlers/rest/register_rest.py +56 -0
  335. aiq/registry_handlers/rest/rest_handler.py +237 -0
  336. aiq/registry_handlers/schemas/__init__.py +0 -0
  337. aiq/registry_handlers/schemas/headers.py +42 -0
  338. aiq/registry_handlers/schemas/package.py +68 -0
  339. aiq/registry_handlers/schemas/publish.py +63 -0
  340. aiq/registry_handlers/schemas/pull.py +82 -0
  341. aiq/registry_handlers/schemas/remove.py +36 -0
  342. aiq/registry_handlers/schemas/search.py +91 -0
  343. aiq/registry_handlers/schemas/status.py +47 -0
  344. aiq/retriever/__init__.py +0 -0
  345. aiq/retriever/interface.py +37 -0
  346. aiq/retriever/milvus/__init__.py +14 -0
  347. aiq/retriever/milvus/register.py +81 -0
  348. aiq/retriever/milvus/retriever.py +228 -0
  349. aiq/retriever/models.py +74 -0
  350. aiq/retriever/nemo_retriever/__init__.py +14 -0
  351. aiq/retriever/nemo_retriever/register.py +60 -0
  352. aiq/retriever/nemo_retriever/retriever.py +190 -0
  353. aiq/retriever/register.py +22 -0
  354. aiq/runtime/__init__.py +14 -0
  355. aiq/runtime/loader.py +215 -0
  356. aiq/runtime/runner.py +190 -0
  357. aiq/runtime/session.py +158 -0
  358. aiq/runtime/user_metadata.py +130 -0
  359. aiq/settings/__init__.py +0 -0
  360. aiq/settings/global_settings.py +318 -0
  361. aiq/test/.namespace +1 -0
  362. aiq/tool/__init__.py +0 -0
  363. aiq/tool/chat_completion.py +74 -0
  364. aiq/tool/code_execution/README.md +151 -0
  365. aiq/tool/code_execution/__init__.py +0 -0
  366. aiq/tool/code_execution/code_sandbox.py +267 -0
  367. aiq/tool/code_execution/local_sandbox/.gitignore +1 -0
  368. aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
  369. aiq/tool/code_execution/local_sandbox/__init__.py +13 -0
  370. aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +198 -0
  371. aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +6 -0
  372. aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +50 -0
  373. aiq/tool/code_execution/register.py +74 -0
  374. aiq/tool/code_execution/test_code_execution_sandbox.py +414 -0
  375. aiq/tool/code_execution/utils.py +100 -0
  376. aiq/tool/datetime_tools.py +42 -0
  377. aiq/tool/document_search.py +141 -0
  378. aiq/tool/github_tools/__init__.py +0 -0
  379. aiq/tool/github_tools/create_github_commit.py +133 -0
  380. aiq/tool/github_tools/create_github_issue.py +87 -0
  381. aiq/tool/github_tools/create_github_pr.py +106 -0
  382. aiq/tool/github_tools/get_github_file.py +106 -0
  383. aiq/tool/github_tools/get_github_issue.py +166 -0
  384. aiq/tool/github_tools/get_github_pr.py +256 -0
  385. aiq/tool/github_tools/update_github_issue.py +100 -0
  386. aiq/tool/mcp/__init__.py +14 -0
  387. aiq/tool/mcp/exceptions.py +142 -0
  388. aiq/tool/mcp/mcp_client.py +255 -0
  389. aiq/tool/mcp/mcp_tool.py +96 -0
  390. aiq/tool/memory_tools/__init__.py +0 -0
  391. aiq/tool/memory_tools/add_memory_tool.py +79 -0
  392. aiq/tool/memory_tools/delete_memory_tool.py +67 -0
  393. aiq/tool/memory_tools/get_memory_tool.py +72 -0
  394. aiq/tool/nvidia_rag.py +95 -0
  395. aiq/tool/register.py +38 -0
  396. aiq/tool/retriever.py +89 -0
  397. aiq/tool/server_tools.py +66 -0
  398. aiq/utils/__init__.py +0 -0
  399. aiq/utils/data_models/__init__.py +0 -0
  400. aiq/utils/data_models/schema_validator.py +58 -0
  401. aiq/utils/debugging_utils.py +43 -0
  402. aiq/utils/dump_distro_mapping.py +32 -0
  403. aiq/utils/exception_handlers/__init__.py +0 -0
  404. aiq/utils/exception_handlers/automatic_retries.py +289 -0
  405. aiq/utils/exception_handlers/mcp.py +211 -0
  406. aiq/utils/exception_handlers/schemas.py +114 -0
  407. aiq/utils/io/__init__.py +0 -0
  408. aiq/utils/io/model_processing.py +28 -0
  409. aiq/utils/io/yaml_tools.py +119 -0
  410. aiq/utils/log_utils.py +37 -0
  411. aiq/utils/metadata_utils.py +74 -0
  412. aiq/utils/optional_imports.py +142 -0
  413. aiq/utils/producer_consumer_queue.py +178 -0
  414. aiq/utils/reactive/__init__.py +0 -0
  415. aiq/utils/reactive/base/__init__.py +0 -0
  416. aiq/utils/reactive/base/observable_base.py +65 -0
  417. aiq/utils/reactive/base/observer_base.py +55 -0
  418. aiq/utils/reactive/base/subject_base.py +79 -0
  419. aiq/utils/reactive/observable.py +59 -0
  420. aiq/utils/reactive/observer.py +76 -0
  421. aiq/utils/reactive/subject.py +131 -0
  422. aiq/utils/reactive/subscription.py +49 -0
  423. aiq/utils/settings/__init__.py +0 -0
  424. aiq/utils/settings/global_settings.py +197 -0
  425. aiq/utils/string_utils.py +38 -0
  426. aiq/utils/type_converter.py +290 -0
  427. aiq/utils/type_utils.py +484 -0
  428. aiq/utils/url_utils.py +27 -0
  429. nvidia_nat-1.2.0rc5.dist-info/METADATA +363 -0
  430. nvidia_nat-1.2.0rc5.dist-info/RECORD +435 -0
  431. nvidia_nat-1.2.0rc5.dist-info/WHEEL +5 -0
  432. nvidia_nat-1.2.0rc5.dist-info/entry_points.txt +20 -0
  433. nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE-3rd-party.txt +3686 -0
  434. nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE.md +201 -0
  435. nvidia_nat-1.2.0rc5.dist-info/top_level.txt +1 -0
@@ -0,0 +1,168 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import asyncio
17
+ import logging
18
+ import re
19
+
20
+ from aiq.builder.builder import Builder
21
+ from aiq.builder.framework_enum import LLMFrameworkEnum
22
+ from aiq.cli.register_workflow import register_ttc_strategy
23
+ from aiq.data_models.ttc_strategy import TTCStrategyBaseConfig
24
+ from aiq.experimental.test_time_compute.models.scoring_config import LLMBasedPlanScoringConfig
25
+ from aiq.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
26
+ from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum
27
+ from aiq.experimental.test_time_compute.models.strategy_base import StrategyBase
28
+ from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
29
+ from aiq.utils.io.model_processing import remove_r1_think_tags
30
+
31
+ logger = logging.getLogger(__name__)
32
+
33
+
34
class LLMBasedPlanScorer(StrategyBase):
    """
    Scoring strategy that asks an LLM to rate each candidate plan.

    The LLM is resolved from `config.scoring_llm` in `build_components`, prompted with
    `config.scoring_template`, and is expected to answer with a line of the form
    `FINAL SCORE: <float>`.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        super().__init__(config)
        # Populated by `build_components`; stays None until then.
        self.llm_bound = None

    async def build_components(self, builder: Builder) -> None:
        """
        Build the components required for the scorer.

        Args:
            builder (Builder): Builder used to resolve `config.scoring_llm` as a LangChain-wrapped LLM.
        """
        self.llm_bound = await builder.get_llm(self.config.scoring_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types this strategy can be used in (planning only)."""
        return [PipelineTypeEnum.PLANNING]

    def stage_type(self) -> StageTypeEnum:
        """Return the stage this strategy implements (scoring)."""
        return StageTypeEnum.SCORING

    async def score_single(self, original_prompt: str, agent_context: str, planning_item: TTCItem) -> float:
        """
        Score a single planning item using the LLM.

        Args:
            original_prompt (str): The original prompt.
            agent_context (str): The agent context.
            planning_item (TTCItem): The item to score; its `plan` is sent to the LLM with
                R1-style think tags removed.

        Returns:
            float: The parsed score, or 0.0 when no `FINAL SCORE:` value is found in the response.

        Raises:
            ImportError: If langchain-core is not installed.
            ValueError: If `llm_bound` is not a `BaseChatModel`, or the LLM response content is not a string.
        """

        # Imported lazily so the module can be loaded without langchain-core installed.
        try:
            from langchain_core.language_models import BaseChatModel
            from langchain_core.prompts import PromptTemplate
        except ImportError as exc:
            raise ImportError("langchain-core is not installed. Please install it to use LLMBasedPlanScorer.\n"
                              "This error can be resolved by installing aiqtoolkit-langchain.") from exc

        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("The `scoring_llm` must be an instance of `BaseChatModel`.")

        model: BaseChatModel = self.llm_bound

        prompt_template = PromptTemplate(
            template=self.config.scoring_template,
            input_variables=["original_prompt", "context", "plan"],
            validate_template=True,
        )

        prompt = await prompt_template.ainvoke(
            input={
                "original_prompt": original_prompt,
                "context": agent_context,
                "plan": remove_r1_think_tags(planning_item.plan),
            })

        response = (await model.ainvoke(prompt)).content

        # Score will follow the format of `FINAL SCORE: <float>` in the response from the LLM
        if not isinstance(response, str):
            logger.warning("Invalid response from LLM for scoring: %s.", response)
            raise ValueError("Unable to parse the score from the LLM response.")

        response = response.strip()

        # Capture exactly one decimal number. The looser `[\d.]+` would also swallow trailing
        # punctuation (e.g. "8.5." at the end of a sentence) and make `float()` fail.
        match = re.search(r'FINAL SCORE:\s*(\d+(?:\.\d*)?|\.\d+)', response)
        if match is None:
            logger.warning("Could not parse the score from the response: %s.", response)
            return 0.0

        # The pattern only captures strings that `float()` accepts.
        return float(match.group(1))

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Score a list of planning items.

        Args:
            items (list[TTCItem]): The list of planning items to score.
            original_prompt (str): The original prompt.
            agent_context (str): The agent context.

        Returns:
            list[TTCItem]: The same items, each with its `score` attribute set. An empty
            list is returned when `items` is empty.

        Raises:
            ValueError: If the number of scores does not match the number of items.
        """
        if not items:
            return []

        # Run score_single concurrently for all planning items
        tasks = [
            self.score_single(original_prompt=original_prompt, agent_context=agent_context, planning_item=item)
            for item in items
        ]
        scores = await asyncio.gather(*tasks)

        if len(scores) != len(items):
            logger.warning("Number of scores %d does not match the number of planning items %d.",
                           len(scores),
                           len(items))
            raise ValueError("Mismatch in number of scores and planning items.")

        logger.debug("Scores for planning items: %s", scores)

        # Set the score on each planning item for reference
        for item, score in zip(items, scores):
            item.score = score

        return items
152
+
153
+
154
@register_ttc_strategy(config_type=LLMBasedPlanScoringConfig)
async def register_llm_based_plan_scorer(config: LLMBasedPlanScoringConfig, builder: Builder):
    """
    Create an LLM-based plan scorer for the given configuration.

    Registered through `register_ttc_strategy` for `LLMBasedPlanScoringConfig`.

    Args:
        config (LLMBasedPlanScoringConfig): The configuration used to construct the scorer.
        builder (Builder): The builder instance passed to the scorer's `build_components`.

    Yields:
        LLMBasedPlanScorer: The scorer, after its components have been built.
    """
    plan_scorer = LLMBasedPlanScorer(config)
    # Components are built before the scorer is handed out.
    await plan_scorer.build_components(builder)
    yield plan_scorer
@@ -0,0 +1,111 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import asyncio
17
+ import logging
18
+ import re
19
+
20
+ from aiq.builder.builder import Builder
21
+ from aiq.builder.framework_enum import LLMFrameworkEnum
22
+ from aiq.cli.register_workflow import register_ttc_strategy
23
+ from aiq.data_models.ttc_strategy import TTCStrategyBaseConfig
24
+ from aiq.experimental.test_time_compute.models.scoring_config import MotivationAwareScoringConfig
25
+ from aiq.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
26
+ from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum
27
+ from aiq.experimental.test_time_compute.models.strategy_base import StrategyBase
28
+ from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
29
+ from aiq.utils.io.model_processing import remove_r1_think_tags
30
+
31
+ logger = logging.getLogger(__name__)
32
+
33
+
34
class MotivationAwareScorer(StrategyBase):
    """
    A strategy that scores a TTCItem's output based on how well it
    addresses both the original input (task) and the 'motivation' from metadata.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        super().__init__(config)
        # Set by build_components(); ainvoke() rejects anything that is not a BaseChatModel.
        self.llm_bound = None

    async def build_components(self, builder: Builder) -> None:
        """Fetch the LLM named by ``config.scoring_llm`` from the builder with the LangChain wrapper."""
        self.llm_bound = await builder.get_llm(self.config.scoring_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        return [PipelineTypeEnum.TOOL_USE]

    def stage_type(self) -> StageTypeEnum:
        return StageTypeEnum.SCORING

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Scores each item by combining the original 'task_description' and 'motivation' with the 'output'.
        The resulting score is stored in item.score.

        Args:
            items (list[TTCItem]): Items to score; ``input``, ``metadata`` and ``output`` feed the prompt.
            original_prompt (str | None): Not used by this strategy.
            agent_context (str | None): Not used by this strategy.

        Returns:
            list[TTCItem]: The same ``items`` list with ``score`` set on every element. An item whose
            LLM response has no parsable ``FINAL SCORE:`` value receives ``0.0``.

        Raises:
            ImportError: If langchain-core cannot be imported.
            ValueError: If the bound scoring LLM is not a ``BaseChatModel``.
        """
        try:
            from langchain_core.language_models import BaseChatModel
            from langchain_core.prompts import PromptTemplate
        except ImportError as exc:
            raise ImportError("langchain-core is required for MotivationAwareScorer. "
                              "Install aiqtoolkit-langchain or similar.") from exc

        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("scoring_llm must be a BaseChatModel instance for MotivationAwareScorer.")

        scoring_model: BaseChatModel = self.llm_bound

        scoring_template = PromptTemplate(template=self.config.scoring_template,
                                          input_variables=["task", "motivation", "output"],
                                          validate_template=True)

        async def score_item(item: TTCItem) -> float:
            # str(None) is the truthy string "None", so `str(x) or ""` never falls back;
            # missing fields have to be mapped to "" explicitly.
            task_str = "" if item.input is None else str(item.input)
            motivation_str = str(item.metadata) if item.metadata else ""
            output_str = "" if item.output is None else str(item.output)

            prompt = (await scoring_template.ainvoke({
                "task": task_str, "motivation": motivation_str, "output": output_str
            })).to_string()

            response = (await scoring_model.ainvoke(prompt)).content
            response = remove_r1_think_tags(response or "")

            match = re.search(r'FINAL SCORE:\s*([\d.]+)', response)
            if not match:
                logger.warning("Could not parse score from response: %s", response)
                return 0.0

            score_str = match.group(1)
            try:
                return float(score_str)
            except ValueError:
                # The pattern also admits strings such as "1.2.3" that float() rejects.
                logger.warning("Could not convert score '%s' to float.", score_str)
                return 0.0

        # asyncio.gather returns results in input order, so each score lines up with its item.
        scores = await asyncio.gather(*(score_item(item) for item in items))

        for item, score in zip(items, scores):
            item.score = score

        return items
105
+
106
+
107
@register_ttc_strategy(config_type=MotivationAwareScoringConfig)
async def register_motivation_aware_scorer(config: MotivationAwareScoringConfig, builder: Builder):
    """
    Construct a MotivationAwareScorer from ``config``, build its components
    with ``builder``, and yield the ready strategy.
    """
    motivation_scorer = MotivationAwareScorer(config)
    await motivation_scorer.build_components(builder)
    yield motivation_scorer
File without changes
@@ -0,0 +1,128 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import asyncio
17
+ import logging
18
+ import re
19
+
20
+ from aiq.builder.builder import Builder
21
+ from aiq.builder.framework_enum import LLMFrameworkEnum
22
+ from aiq.cli.register_workflow import register_ttc_strategy
23
+ from aiq.experimental.test_time_compute.models.search_config import MultiLLMPlanConfig
24
+ from aiq.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
25
+ from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum
26
+ from aiq.experimental.test_time_compute.models.strategy_base import StrategyBase
27
+ from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
28
+ from aiq.utils.io.model_processing import remove_r1_think_tags
29
+
30
+ logger = logging.getLogger(__name__)
31
+
32
+
33
class MultiLLMPlanner(StrategyBase):
    """
    A planner that uses multiple LLMs to generate plans. Each LLM can generate
    a specified number of plans, and all plans are combined.
    """

    def __init__(self, config: MultiLLMPlanConfig) -> None:
        super().__init__(config)
        self.config = config
        self.llms_bound = []  # Will hold the "bound" LLMs after build_components

    async def build_components(self, builder: Builder) -> None:
        """
        Build the components required for this multi-LLM planner.
        Binds each LLMRef from the config with the selected framework wrapper (LANGCHAIN).
        """
        logger.debug("Building components for MultiLLMPlanner")
        # Rebuild from scratch so a repeated call does not accumulate duplicates.
        self.llms_bound = []
        for llm_ref in self.config.llms:
            bound_llm = await builder.get_llm(llm_ref, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
            self.llms_bound.append(bound_llm)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        return [PipelineTypeEnum.PLANNING]

    def stage_type(self) -> StageTypeEnum:
        return StageTypeEnum.SEARCH

    async def _generate_plan_for_temperature(self, llm, base_prompt: str, temperature: float) -> TTCItem:
        """
        Generate one plan from ``llm`` at the given sampling temperature.

        Returns a TTCItem whose ``plan`` is the response text with a leading "PLAN:" marker
        removed, or the placeholder "Plan was not generated" when nothing remains.
        """
        bound_llm = llm.bind(temperature=temperature)
        response = await bound_llm.ainvoke(base_prompt)
        cleaned = remove_r1_think_tags(response.content if hasattr(response, 'content') else str(response))
        # The plan is expected to start with "PLAN:" and all the text after it is the plan
        cleaned = re.sub(r'(?i)^\s*PLAN:\s*', '', cleaned).strip()

        if not cleaned:
            logger.warning("No plan generated for the prompt: %s.", base_prompt)
            # Return a placeholder item rather than raising, to avoid breaking the generation loop
            return TTCItem(plan="Plan was not generated")

        return TTCItem(plan=cleaned)

    async def _generate_plans_for_llm(self, llm, base_prompt: str) -> list[TTCItem]:
        """
        Generate ``config.plans_per_llm`` plans from one LLM, concurrently.

        Temperatures are spaced evenly from ``min_temperature`` to ``max_temperature``;
        a single plan uses ``min_temperature``.
        """
        plan_count = self.config.plans_per_llm
        min_temp = self.config.min_temperature
        if plan_count == 1:
            # One plan has no interval to interpolate over; (plan_count - 1) would be a zero divisor.
            temps = [min_temp]
        else:
            temp_range = self.config.max_temperature - min_temp
            temps = [min_temp + (i / (plan_count - 1)) * temp_range for i in range(plan_count)]

        tasks = [self._generate_plan_for_temperature(llm, base_prompt, temp) for temp in temps]
        return await asyncio.gather(*tasks)

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Generate a list of TTCItems by querying each LLM in self.llms_bound.
        Each LLM produces 'plans_per_llm' plans.

        Args:
            items (list[TTCItem]): Not read by this strategy; plans are generated from the prompt.
            original_prompt (str | None): Fills the template's ``prompt`` variable.
            agent_context (str | None): Fills the template's ``context`` variable.

        Returns:
            list[TTCItem]: All generated plans, grouped by LLM in ``self.llms_bound`` order.

        Raises:
            ImportError: If langchain-core cannot be imported.
        """
        try:
            from langchain_core.prompts import PromptTemplate
        except ImportError as exc:
            raise ImportError("langchain-core is not installed. Please install it to use MultiLLMPlanner.\n"
                              "This error can be resolve by installing aiqtoolkit-langchain.") from exc

        # Create a single PromptTemplate
        planning_template = PromptTemplate(template=self.config.planning_template,
                                           input_variables=["context", "prompt"],
                                           validate_template=True)

        # Format the prompt once
        base_prompt = (await planning_template.ainvoke({
            "context": agent_context, "prompt": original_prompt
        })).to_string()

        # Launch generation for each LLM concurrently
        tasks = [self._generate_plans_for_llm(llm, base_prompt) for llm in self.llms_bound]
        results_nested = await asyncio.gather(*tasks)

        # Flatten the nested lists of TTCItem
        all_plans: list[TTCItem] = [plan for llm_plans in results_nested for plan in llm_plans]
        logger.info("MultiLLMPlanner generated %d plans total.", len(all_plans))
        return all_plans
119
+
120
+
121
@register_ttc_strategy(config_type=MultiLLMPlanConfig)
async def register_multi_llm_planner(config: MultiLLMPlanConfig, builder: Builder):
    """
    Construct a MultiLLMPlanner from ``config``, build its components with
    ``builder``, and yield the ready strategy.
    """
    multi_llm_planner = MultiLLMPlanner(config)
    await multi_llm_planner.build_components(builder)
    yield multi_llm_planner
@@ -0,0 +1,122 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import logging
17
+
18
+ from aiq.builder.builder import Builder
19
+ from aiq.builder.framework_enum import LLMFrameworkEnum
20
+ from aiq.cli.register_workflow import register_ttc_strategy
21
+ from aiq.experimental.test_time_compute.models.search_config import MultiQueryRetrievalSearchConfig
22
+ from aiq.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
23
+ from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum
24
+ from aiq.experimental.test_time_compute.models.strategy_base import StrategyBase
25
+ from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
26
+ from aiq.utils.io.model_processing import remove_r1_think_tags
27
+
28
+ logger = logging.getLogger(__name__)
29
+
30
+
31
class MultiQueryRetrievalSearch(StrategyBase):
    """
    A strategy that, for each incoming TTCItem, generates multiple new items by
    re-writing the input 'task_description' from different perspectives.
    Uses multiple LLMs to encourage diversity.
    """

    def __init__(self, config: MultiQueryRetrievalSearchConfig) -> None:
        super().__init__(config)
        self.config = config
        self.llms_bound = []

    async def build_components(self, builder: Builder) -> None:
        """
        Binds each LLMRef in self.config.llms to an actual LLM client.
        """
        # Rebuild from scratch so a repeated call does not accumulate duplicates.
        self.llms_bound = []
        for llm_ref in self.config.llms:
            bound_llm = await builder.get_llm(llm_ref, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
            self.llms_bound.append(bound_llm)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        return [PipelineTypeEnum.TOOL_USE]

    def stage_type(self) -> StageTypeEnum:
        return StageTypeEnum.SEARCH

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        For each TTCItem, rewrite the 'input' using each LLM to create a new perspective.
        The new TTCItems' 'output' field will store the newly generated query.

        Args:
            items (list[TTCItem]): Items whose ``input`` and ``metadata`` feed the rewrite prompt.
            original_prompt (str | None): Not used by this strategy.
            agent_context (str | None): Not used by this strategy.

        Returns:
            list[TTCItem]: For every input item, one pass-through item (``output`` set to the
            original ``input``) followed by one item per bound LLM holding that LLM's rewrite.

        Raises:
            ImportError: If langchain-core cannot be imported.
        """
        try:
            from langchain_core.prompts import PromptTemplate
        except ImportError as exc:
            raise ImportError("langchain-core is required for MultiQueryRetrievalSearch. "
                              "Install aiqtoolkit-langchain or similar.") from exc

        new_ttc_items: list[TTCItem] = []

        # Create a single PromptTemplate object for rewriting the query
        template_vars = ["task", "motivation"]
        query_template = PromptTemplate(template=self.config.query_generation_template,
                                        input_variables=template_vars,
                                        validate_template=True)

        for item in items:
            # str(None) is the truthy string "None", so `str(x) or ""` never falls back;
            # a missing input has to be mapped to "" explicitly.
            original_task = "" if item.input is None else str(item.input)
            motivation = str(item.metadata) if item.metadata else ""

            # Keep the unmodified query as a candidate alongside the rewrites.
            new_ttc_items.append(
                TTCItem(
                    input=item.input,
                    output=item.input,
                    metadata=item.metadata,
                    name=item.name,  # keep the original tool name
                ))

            # The prompt depends only on the item, so render it once and reuse it for every LLM.
            prompt_str = (await query_template.ainvoke({
                "task": original_task, "motivation": motivation
            })).to_string()

            for llm in self.llms_bound:
                # We'll call each LLM to produce a new query
                response = await llm.ainvoke(prompt_str)
                cleaned = remove_r1_think_tags(response.content if hasattr(response, 'content') else str(response))
                cleaned = cleaned.strip()

                # Create a new TTCItem for each newly generated query
                new_ttc_items.append(
                    TTCItem(
                        input=item.input,  # keep the original input for reference
                        output=cleaned,  # store the newly generated query in the output
                        metadata=item.metadata,
                        name=item.name,  # same tool name or optional new name
                    ))

        logger.info("MultiQueryRetrievalSearch produced %d new items from %d original items.",
                    len(new_ttc_items),
                    len(items))

        return new_ttc_items
116
+
117
+
118
@register_ttc_strategy(config_type=MultiQueryRetrievalSearchConfig)
async def register_multi_query_retrieval_search(config: MultiQueryRetrievalSearchConfig, builder: Builder):
    """
    Construct a MultiQueryRetrievalSearch from ``config``, build its components
    with ``builder``, and yield the ready strategy.
    """
    search_strategy = MultiQueryRetrievalSearch(config)
    await search_strategy.build_components(builder)
    yield search_strategy
@@ -0,0 +1,128 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import asyncio
17
+ import logging
18
+ import re
19
+
20
+ from aiq.builder.builder import Builder
21
+ from aiq.builder.framework_enum import LLMFrameworkEnum
22
+ from aiq.cli.register_workflow import register_ttc_strategy
23
+ from aiq.data_models.ttc_strategy import TTCStrategyBaseConfig
24
+ from aiq.experimental.test_time_compute.models.search_config import SingleShotMultiPlanConfig
25
+ from aiq.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
26
+ from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum
27
+ from aiq.experimental.test_time_compute.models.strategy_base import StrategyBase
28
+ from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
29
+ from aiq.utils.io.model_processing import remove_r1_think_tags
30
+
31
+ logger = logging.getLogger(__name__)
32
+
33
+
34
class SingleShotMultiPlanPlanner(StrategyBase):
    """
    Implementation of the Single Shot Multi Plan Planner.
    This planner generates multiple plans in a single shot.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        super().__init__(config)
        # Set by build_components(); ainvoke() rejects anything that is not a BaseChatModel.
        self.llm_bound = None

    async def build_components(self, builder: Builder) -> None:
        """Fetch the LLM named by ``config.planning_llm`` from the builder with the LangChain wrapper."""
        self.llm_bound = await builder.get_llm(self.config.planning_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        return [PipelineTypeEnum.PLANNING]

    def stage_type(self) -> StageTypeEnum:
        return StageTypeEnum.SEARCH

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Generate ``config.num_plans`` TTCItems from the provided prompt, one per temperature.

        Args:
            items (list[TTCItem]): Not read by this strategy; plans are generated from the prompt.
            original_prompt (str | None): Fills the template's ``prompt`` variable.
            agent_context (str | None): Fills the template's ``context`` variable.

        Returns:
            list[TTCItem]: One item per temperature, ordered from ``min_temperature`` upward.

        Raises:
            ImportError: If langchain-core cannot be imported.
            ValueError: If the bound planning LLM is not a ``BaseChatModel``, or no plans were generated.
        """

        try:
            from langchain_core.language_models import BaseChatModel
            from langchain_core.prompts import PromptTemplate
        except ImportError as exc:
            raise ImportError("langchain-core is not installed. Please install it to use SingleShotMultiPlanPlanner.\n"
                              "This error can be resolve by installing aiqtoolkit-langchain.") from exc

        planning_template = PromptTemplate(template=self.config.planning_template,
                                           input_variables=["context", "prompt"],
                                           validate_template=True)
        prompt = (await planning_template.ainvoke(input={
            "context": agent_context, "prompt": original_prompt
        })).to_string()

        # The bound planning LLM must be a BaseChatModel
        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("The `planning_llm` must be an instance of `BaseChatModel`.")

        model: BaseChatModel = self.llm_bound

        async def generate_plan(llm: BaseChatModel, plan_prompt: str, temperature: float) -> TTCItem:
            """
            Helper function to generate a plan using the provided prompt and temperature.
            """
            llm_bound = llm.bind(temperature=temperature)
            response = await llm_bound.ainvoke(plan_prompt)
            cleaned = remove_r1_think_tags(response.content if hasattr(response, 'content') else str(response))

            # The plan is the text following a leading 'PLAN:' marker; strip the marker with a regex
            cleaned = re.sub(r'(?i)^\s*PLAN:\s*', '', cleaned).strip()

            if not cleaned:
                logger.warning("No plan generated for the prompt: %s.", plan_prompt)
                # Return a placeholder item rather than raising, to avoid breaking the generation loop
                return TTCItem(plan="Plan was not generated")

            return TTCItem(plan=cleaned)

        # Spread temperatures evenly between the configured min and max, one per plan.
        num_plans = self.config.num_plans
        min_temp = self.config.min_temperature
        if num_plans == 1:
            # One plan has no interval to interpolate over, and (num_plans - 1) would be a
            # zero divisor; use the minimum temperature.
            temperatures = [min_temp]
        else:
            temp_range = self.config.max_temperature - min_temp
            temperatures = [min_temp + (i / (num_plans - 1)) * temp_range for i in range(num_plans)]

        # Generate plans using the defined temperatures in parallel using asyncio
        tasks = [generate_plan(model, prompt, temperature) for temperature in temperatures]
        # Run the tasks concurrently and gather results
        plans = await asyncio.gather(*tasks)

        if not plans:
            raise ValueError("No plans were generated. Please check the LLM response.")

        logger.info("Generated %d plans from the SingleShotMultiPlanPlanner", len(plans))

        # Serialising every plan is only worth doing when the debug record will be emitted.
        if logger.isEnabledFor(logging.DEBUG):
            logger.debug("Generated plans: %s", [plan.dict() for plan in plans])

        return plans
119
+
120
+
121
@register_ttc_strategy(config_type=SingleShotMultiPlanConfig)
async def register_single_shot_multi_plan_planner(config: SingleShotMultiPlanConfig, builder: Builder):
    """
    Construct a SingleShotMultiPlanPlanner from ``config``, build its components
    with ``builder``, and yield the ready strategy.
    """
    single_shot_planner = SingleShotMultiPlanPlanner(config)
    await single_shot_planner.build_components(builder)
    yield single_shot_planner