nvidia-nat 1.2.0rc5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (435) hide show
  1. aiq/agent/__init__.py +0 -0
  2. aiq/agent/base.py +239 -0
  3. aiq/agent/dual_node.py +67 -0
  4. aiq/agent/react_agent/__init__.py +0 -0
  5. aiq/agent/react_agent/agent.py +355 -0
  6. aiq/agent/react_agent/output_parser.py +104 -0
  7. aiq/agent/react_agent/prompt.py +41 -0
  8. aiq/agent/react_agent/register.py +149 -0
  9. aiq/agent/reasoning_agent/__init__.py +0 -0
  10. aiq/agent/reasoning_agent/reasoning_agent.py +225 -0
  11. aiq/agent/register.py +23 -0
  12. aiq/agent/rewoo_agent/__init__.py +0 -0
  13. aiq/agent/rewoo_agent/agent.py +411 -0
  14. aiq/agent/rewoo_agent/prompt.py +108 -0
  15. aiq/agent/rewoo_agent/register.py +158 -0
  16. aiq/agent/tool_calling_agent/__init__.py +0 -0
  17. aiq/agent/tool_calling_agent/agent.py +119 -0
  18. aiq/agent/tool_calling_agent/register.py +106 -0
  19. aiq/authentication/__init__.py +14 -0
  20. aiq/authentication/api_key/__init__.py +14 -0
  21. aiq/authentication/api_key/api_key_auth_provider.py +96 -0
  22. aiq/authentication/api_key/api_key_auth_provider_config.py +124 -0
  23. aiq/authentication/api_key/register.py +26 -0
  24. aiq/authentication/exceptions/__init__.py +14 -0
  25. aiq/authentication/exceptions/api_key_exceptions.py +38 -0
  26. aiq/authentication/http_basic_auth/__init__.py +0 -0
  27. aiq/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
  28. aiq/authentication/http_basic_auth/register.py +30 -0
  29. aiq/authentication/interfaces.py +93 -0
  30. aiq/authentication/oauth2/__init__.py +14 -0
  31. aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +107 -0
  32. aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
  33. aiq/authentication/oauth2/register.py +25 -0
  34. aiq/authentication/register.py +21 -0
  35. aiq/builder/__init__.py +0 -0
  36. aiq/builder/builder.py +285 -0
  37. aiq/builder/component_utils.py +316 -0
  38. aiq/builder/context.py +264 -0
  39. aiq/builder/embedder.py +24 -0
  40. aiq/builder/eval_builder.py +161 -0
  41. aiq/builder/evaluator.py +29 -0
  42. aiq/builder/framework_enum.py +24 -0
  43. aiq/builder/front_end.py +73 -0
  44. aiq/builder/function.py +344 -0
  45. aiq/builder/function_base.py +380 -0
  46. aiq/builder/function_info.py +627 -0
  47. aiq/builder/intermediate_step_manager.py +174 -0
  48. aiq/builder/llm.py +25 -0
  49. aiq/builder/retriever.py +25 -0
  50. aiq/builder/user_interaction_manager.py +74 -0
  51. aiq/builder/workflow.py +148 -0
  52. aiq/builder/workflow_builder.py +1117 -0
  53. aiq/cli/__init__.py +14 -0
  54. aiq/cli/cli_utils/__init__.py +0 -0
  55. aiq/cli/cli_utils/config_override.py +231 -0
  56. aiq/cli/cli_utils/validation.py +37 -0
  57. aiq/cli/commands/__init__.py +0 -0
  58. aiq/cli/commands/configure/__init__.py +0 -0
  59. aiq/cli/commands/configure/channel/__init__.py +0 -0
  60. aiq/cli/commands/configure/channel/add.py +28 -0
  61. aiq/cli/commands/configure/channel/channel.py +36 -0
  62. aiq/cli/commands/configure/channel/remove.py +30 -0
  63. aiq/cli/commands/configure/channel/update.py +30 -0
  64. aiq/cli/commands/configure/configure.py +33 -0
  65. aiq/cli/commands/evaluate.py +139 -0
  66. aiq/cli/commands/info/__init__.py +14 -0
  67. aiq/cli/commands/info/info.py +39 -0
  68. aiq/cli/commands/info/list_channels.py +32 -0
  69. aiq/cli/commands/info/list_components.py +129 -0
  70. aiq/cli/commands/info/list_mcp.py +213 -0
  71. aiq/cli/commands/registry/__init__.py +14 -0
  72. aiq/cli/commands/registry/publish.py +88 -0
  73. aiq/cli/commands/registry/pull.py +118 -0
  74. aiq/cli/commands/registry/registry.py +38 -0
  75. aiq/cli/commands/registry/remove.py +108 -0
  76. aiq/cli/commands/registry/search.py +155 -0
  77. aiq/cli/commands/sizing/__init__.py +14 -0
  78. aiq/cli/commands/sizing/calc.py +297 -0
  79. aiq/cli/commands/sizing/sizing.py +27 -0
  80. aiq/cli/commands/start.py +246 -0
  81. aiq/cli/commands/uninstall.py +81 -0
  82. aiq/cli/commands/validate.py +47 -0
  83. aiq/cli/commands/workflow/__init__.py +14 -0
  84. aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
  85. aiq/cli/commands/workflow/templates/config.yml.j2 +16 -0
  86. aiq/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
  87. aiq/cli/commands/workflow/templates/register.py.j2 +5 -0
  88. aiq/cli/commands/workflow/templates/workflow.py.j2 +36 -0
  89. aiq/cli/commands/workflow/workflow.py +37 -0
  90. aiq/cli/commands/workflow/workflow_commands.py +313 -0
  91. aiq/cli/entrypoint.py +135 -0
  92. aiq/cli/main.py +44 -0
  93. aiq/cli/register_workflow.py +488 -0
  94. aiq/cli/type_registry.py +1000 -0
  95. aiq/data_models/__init__.py +14 -0
  96. aiq/data_models/api_server.py +694 -0
  97. aiq/data_models/authentication.py +231 -0
  98. aiq/data_models/common.py +171 -0
  99. aiq/data_models/component.py +54 -0
  100. aiq/data_models/component_ref.py +168 -0
  101. aiq/data_models/config.py +406 -0
  102. aiq/data_models/dataset_handler.py +123 -0
  103. aiq/data_models/discovery_metadata.py +335 -0
  104. aiq/data_models/embedder.py +27 -0
  105. aiq/data_models/evaluate.py +127 -0
  106. aiq/data_models/evaluator.py +26 -0
  107. aiq/data_models/front_end.py +26 -0
  108. aiq/data_models/function.py +30 -0
  109. aiq/data_models/function_dependencies.py +72 -0
  110. aiq/data_models/interactive.py +246 -0
  111. aiq/data_models/intermediate_step.py +302 -0
  112. aiq/data_models/invocation_node.py +38 -0
  113. aiq/data_models/llm.py +27 -0
  114. aiq/data_models/logging.py +26 -0
  115. aiq/data_models/memory.py +27 -0
  116. aiq/data_models/object_store.py +44 -0
  117. aiq/data_models/profiler.py +54 -0
  118. aiq/data_models/registry_handler.py +26 -0
  119. aiq/data_models/retriever.py +30 -0
  120. aiq/data_models/retry_mixin.py +35 -0
  121. aiq/data_models/span.py +187 -0
  122. aiq/data_models/step_adaptor.py +64 -0
  123. aiq/data_models/streaming.py +33 -0
  124. aiq/data_models/swe_bench_model.py +54 -0
  125. aiq/data_models/telemetry_exporter.py +26 -0
  126. aiq/data_models/ttc_strategy.py +30 -0
  127. aiq/embedder/__init__.py +0 -0
  128. aiq/embedder/langchain_client.py +41 -0
  129. aiq/embedder/nim_embedder.py +59 -0
  130. aiq/embedder/openai_embedder.py +43 -0
  131. aiq/embedder/register.py +24 -0
  132. aiq/eval/__init__.py +14 -0
  133. aiq/eval/config.py +60 -0
  134. aiq/eval/dataset_handler/__init__.py +0 -0
  135. aiq/eval/dataset_handler/dataset_downloader.py +106 -0
  136. aiq/eval/dataset_handler/dataset_filter.py +52 -0
  137. aiq/eval/dataset_handler/dataset_handler.py +254 -0
  138. aiq/eval/evaluate.py +506 -0
  139. aiq/eval/evaluator/__init__.py +14 -0
  140. aiq/eval/evaluator/base_evaluator.py +73 -0
  141. aiq/eval/evaluator/evaluator_model.py +45 -0
  142. aiq/eval/intermediate_step_adapter.py +99 -0
  143. aiq/eval/rag_evaluator/__init__.py +0 -0
  144. aiq/eval/rag_evaluator/evaluate.py +178 -0
  145. aiq/eval/rag_evaluator/register.py +143 -0
  146. aiq/eval/register.py +23 -0
  147. aiq/eval/remote_workflow.py +133 -0
  148. aiq/eval/runners/__init__.py +14 -0
  149. aiq/eval/runners/config.py +39 -0
  150. aiq/eval/runners/multi_eval_runner.py +54 -0
  151. aiq/eval/runtime_event_subscriber.py +52 -0
  152. aiq/eval/swe_bench_evaluator/__init__.py +0 -0
  153. aiq/eval/swe_bench_evaluator/evaluate.py +215 -0
  154. aiq/eval/swe_bench_evaluator/register.py +36 -0
  155. aiq/eval/trajectory_evaluator/__init__.py +0 -0
  156. aiq/eval/trajectory_evaluator/evaluate.py +75 -0
  157. aiq/eval/trajectory_evaluator/register.py +40 -0
  158. aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
  159. aiq/eval/tunable_rag_evaluator/evaluate.py +245 -0
  160. aiq/eval/tunable_rag_evaluator/register.py +52 -0
  161. aiq/eval/usage_stats.py +41 -0
  162. aiq/eval/utils/__init__.py +0 -0
  163. aiq/eval/utils/output_uploader.py +140 -0
  164. aiq/eval/utils/tqdm_position_registry.py +40 -0
  165. aiq/eval/utils/weave_eval.py +184 -0
  166. aiq/experimental/__init__.py +0 -0
  167. aiq/experimental/decorators/__init__.py +0 -0
  168. aiq/experimental/decorators/experimental_warning_decorator.py +130 -0
  169. aiq/experimental/test_time_compute/__init__.py +0 -0
  170. aiq/experimental/test_time_compute/editing/__init__.py +0 -0
  171. aiq/experimental/test_time_compute/editing/iterative_plan_refinement_editor.py +147 -0
  172. aiq/experimental/test_time_compute/editing/llm_as_a_judge_editor.py +204 -0
  173. aiq/experimental/test_time_compute/editing/motivation_aware_summarization.py +107 -0
  174. aiq/experimental/test_time_compute/functions/__init__.py +0 -0
  175. aiq/experimental/test_time_compute/functions/execute_score_select_function.py +105 -0
  176. aiq/experimental/test_time_compute/functions/its_tool_orchestration_function.py +205 -0
  177. aiq/experimental/test_time_compute/functions/its_tool_wrapper_function.py +146 -0
  178. aiq/experimental/test_time_compute/functions/plan_select_execute_function.py +224 -0
  179. aiq/experimental/test_time_compute/models/__init__.py +0 -0
  180. aiq/experimental/test_time_compute/models/editor_config.py +132 -0
  181. aiq/experimental/test_time_compute/models/scoring_config.py +112 -0
  182. aiq/experimental/test_time_compute/models/search_config.py +120 -0
  183. aiq/experimental/test_time_compute/models/selection_config.py +154 -0
  184. aiq/experimental/test_time_compute/models/stage_enums.py +43 -0
  185. aiq/experimental/test_time_compute/models/strategy_base.py +66 -0
  186. aiq/experimental/test_time_compute/models/tool_use_config.py +41 -0
  187. aiq/experimental/test_time_compute/models/ttc_item.py +48 -0
  188. aiq/experimental/test_time_compute/register.py +36 -0
  189. aiq/experimental/test_time_compute/scoring/__init__.py +0 -0
  190. aiq/experimental/test_time_compute/scoring/llm_based_agent_scorer.py +168 -0
  191. aiq/experimental/test_time_compute/scoring/llm_based_plan_scorer.py +168 -0
  192. aiq/experimental/test_time_compute/scoring/motivation_aware_scorer.py +111 -0
  193. aiq/experimental/test_time_compute/search/__init__.py +0 -0
  194. aiq/experimental/test_time_compute/search/multi_llm_planner.py +128 -0
  195. aiq/experimental/test_time_compute/search/multi_query_retrieval_search.py +122 -0
  196. aiq/experimental/test_time_compute/search/single_shot_multi_plan_planner.py +128 -0
  197. aiq/experimental/test_time_compute/selection/__init__.py +0 -0
  198. aiq/experimental/test_time_compute/selection/best_of_n_selector.py +63 -0
  199. aiq/experimental/test_time_compute/selection/llm_based_agent_output_selector.py +131 -0
  200. aiq/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +159 -0
  201. aiq/experimental/test_time_compute/selection/llm_based_plan_selector.py +128 -0
  202. aiq/experimental/test_time_compute/selection/threshold_selector.py +58 -0
  203. aiq/front_ends/__init__.py +14 -0
  204. aiq/front_ends/console/__init__.py +14 -0
  205. aiq/front_ends/console/authentication_flow_handler.py +233 -0
  206. aiq/front_ends/console/console_front_end_config.py +32 -0
  207. aiq/front_ends/console/console_front_end_plugin.py +96 -0
  208. aiq/front_ends/console/register.py +25 -0
  209. aiq/front_ends/cron/__init__.py +14 -0
  210. aiq/front_ends/fastapi/__init__.py +14 -0
  211. aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
  212. aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
  213. aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +107 -0
  214. aiq/front_ends/fastapi/fastapi_front_end_config.py +234 -0
  215. aiq/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
  216. aiq/front_ends/fastapi/fastapi_front_end_plugin.py +116 -0
  217. aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +1092 -0
  218. aiq/front_ends/fastapi/html_snippets/__init__.py +14 -0
  219. aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
  220. aiq/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
  221. aiq/front_ends/fastapi/job_store.py +183 -0
  222. aiq/front_ends/fastapi/main.py +72 -0
  223. aiq/front_ends/fastapi/message_handler.py +298 -0
  224. aiq/front_ends/fastapi/message_validator.py +345 -0
  225. aiq/front_ends/fastapi/register.py +25 -0
  226. aiq/front_ends/fastapi/response_helpers.py +195 -0
  227. aiq/front_ends/fastapi/step_adaptor.py +321 -0
  228. aiq/front_ends/mcp/__init__.py +14 -0
  229. aiq/front_ends/mcp/mcp_front_end_config.py +32 -0
  230. aiq/front_ends/mcp/mcp_front_end_plugin.py +93 -0
  231. aiq/front_ends/mcp/register.py +27 -0
  232. aiq/front_ends/mcp/tool_converter.py +242 -0
  233. aiq/front_ends/register.py +22 -0
  234. aiq/front_ends/simple_base/__init__.py +14 -0
  235. aiq/front_ends/simple_base/simple_front_end_plugin_base.py +54 -0
  236. aiq/llm/__init__.py +0 -0
  237. aiq/llm/aws_bedrock_llm.py +57 -0
  238. aiq/llm/nim_llm.py +46 -0
  239. aiq/llm/openai_llm.py +46 -0
  240. aiq/llm/register.py +23 -0
  241. aiq/llm/utils/__init__.py +14 -0
  242. aiq/llm/utils/env_config_value.py +94 -0
  243. aiq/llm/utils/error.py +17 -0
  244. aiq/memory/__init__.py +20 -0
  245. aiq/memory/interfaces.py +183 -0
  246. aiq/memory/models.py +112 -0
  247. aiq/meta/module_to_distro.json +3 -0
  248. aiq/meta/pypi.md +58 -0
  249. aiq/object_store/__init__.py +20 -0
  250. aiq/object_store/in_memory_object_store.py +76 -0
  251. aiq/object_store/interfaces.py +84 -0
  252. aiq/object_store/models.py +36 -0
  253. aiq/object_store/register.py +20 -0
  254. aiq/observability/__init__.py +14 -0
  255. aiq/observability/exporter/__init__.py +14 -0
  256. aiq/observability/exporter/base_exporter.py +449 -0
  257. aiq/observability/exporter/exporter.py +78 -0
  258. aiq/observability/exporter/file_exporter.py +33 -0
  259. aiq/observability/exporter/processing_exporter.py +322 -0
  260. aiq/observability/exporter/raw_exporter.py +52 -0
  261. aiq/observability/exporter/span_exporter.py +265 -0
  262. aiq/observability/exporter_manager.py +335 -0
  263. aiq/observability/mixin/__init__.py +14 -0
  264. aiq/observability/mixin/batch_config_mixin.py +26 -0
  265. aiq/observability/mixin/collector_config_mixin.py +23 -0
  266. aiq/observability/mixin/file_mixin.py +288 -0
  267. aiq/observability/mixin/file_mode.py +23 -0
  268. aiq/observability/mixin/resource_conflict_mixin.py +134 -0
  269. aiq/observability/mixin/serialize_mixin.py +61 -0
  270. aiq/observability/mixin/type_introspection_mixin.py +183 -0
  271. aiq/observability/processor/__init__.py +14 -0
  272. aiq/observability/processor/batching_processor.py +310 -0
  273. aiq/observability/processor/callback_processor.py +42 -0
  274. aiq/observability/processor/intermediate_step_serializer.py +28 -0
  275. aiq/observability/processor/processor.py +71 -0
  276. aiq/observability/register.py +96 -0
  277. aiq/observability/utils/__init__.py +14 -0
  278. aiq/observability/utils/dict_utils.py +236 -0
  279. aiq/observability/utils/time_utils.py +31 -0
  280. aiq/plugins/.namespace +1 -0
  281. aiq/profiler/__init__.py +0 -0
  282. aiq/profiler/calc/__init__.py +14 -0
  283. aiq/profiler/calc/calc_runner.py +627 -0
  284. aiq/profiler/calc/calculations.py +288 -0
  285. aiq/profiler/calc/data_models.py +188 -0
  286. aiq/profiler/calc/plot.py +345 -0
  287. aiq/profiler/callbacks/__init__.py +0 -0
  288. aiq/profiler/callbacks/agno_callback_handler.py +295 -0
  289. aiq/profiler/callbacks/base_callback_class.py +20 -0
  290. aiq/profiler/callbacks/langchain_callback_handler.py +290 -0
  291. aiq/profiler/callbacks/llama_index_callback_handler.py +205 -0
  292. aiq/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
  293. aiq/profiler/callbacks/token_usage_base_model.py +27 -0
  294. aiq/profiler/data_frame_row.py +51 -0
  295. aiq/profiler/data_models.py +24 -0
  296. aiq/profiler/decorators/__init__.py +0 -0
  297. aiq/profiler/decorators/framework_wrapper.py +131 -0
  298. aiq/profiler/decorators/function_tracking.py +254 -0
  299. aiq/profiler/forecasting/__init__.py +0 -0
  300. aiq/profiler/forecasting/config.py +18 -0
  301. aiq/profiler/forecasting/model_trainer.py +75 -0
  302. aiq/profiler/forecasting/models/__init__.py +22 -0
  303. aiq/profiler/forecasting/models/forecasting_base_model.py +40 -0
  304. aiq/profiler/forecasting/models/linear_model.py +196 -0
  305. aiq/profiler/forecasting/models/random_forest_regressor.py +268 -0
  306. aiq/profiler/inference_metrics_model.py +28 -0
  307. aiq/profiler/inference_optimization/__init__.py +0 -0
  308. aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
  309. aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +460 -0
  310. aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
  311. aiq/profiler/inference_optimization/data_models.py +386 -0
  312. aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
  313. aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
  314. aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
  315. aiq/profiler/inference_optimization/llm_metrics.py +212 -0
  316. aiq/profiler/inference_optimization/prompt_caching.py +163 -0
  317. aiq/profiler/inference_optimization/token_uniqueness.py +107 -0
  318. aiq/profiler/inference_optimization/workflow_runtimes.py +72 -0
  319. aiq/profiler/intermediate_property_adapter.py +102 -0
  320. aiq/profiler/profile_runner.py +473 -0
  321. aiq/profiler/utils.py +184 -0
  322. aiq/registry_handlers/__init__.py +0 -0
  323. aiq/registry_handlers/local/__init__.py +0 -0
  324. aiq/registry_handlers/local/local_handler.py +176 -0
  325. aiq/registry_handlers/local/register_local.py +37 -0
  326. aiq/registry_handlers/metadata_factory.py +60 -0
  327. aiq/registry_handlers/package_utils.py +567 -0
  328. aiq/registry_handlers/pypi/__init__.py +0 -0
  329. aiq/registry_handlers/pypi/pypi_handler.py +251 -0
  330. aiq/registry_handlers/pypi/register_pypi.py +40 -0
  331. aiq/registry_handlers/register.py +21 -0
  332. aiq/registry_handlers/registry_handler_base.py +157 -0
  333. aiq/registry_handlers/rest/__init__.py +0 -0
  334. aiq/registry_handlers/rest/register_rest.py +56 -0
  335. aiq/registry_handlers/rest/rest_handler.py +237 -0
  336. aiq/registry_handlers/schemas/__init__.py +0 -0
  337. aiq/registry_handlers/schemas/headers.py +42 -0
  338. aiq/registry_handlers/schemas/package.py +68 -0
  339. aiq/registry_handlers/schemas/publish.py +63 -0
  340. aiq/registry_handlers/schemas/pull.py +82 -0
  341. aiq/registry_handlers/schemas/remove.py +36 -0
  342. aiq/registry_handlers/schemas/search.py +91 -0
  343. aiq/registry_handlers/schemas/status.py +47 -0
  344. aiq/retriever/__init__.py +0 -0
  345. aiq/retriever/interface.py +37 -0
  346. aiq/retriever/milvus/__init__.py +14 -0
  347. aiq/retriever/milvus/register.py +81 -0
  348. aiq/retriever/milvus/retriever.py +228 -0
  349. aiq/retriever/models.py +74 -0
  350. aiq/retriever/nemo_retriever/__init__.py +14 -0
  351. aiq/retriever/nemo_retriever/register.py +60 -0
  352. aiq/retriever/nemo_retriever/retriever.py +190 -0
  353. aiq/retriever/register.py +22 -0
  354. aiq/runtime/__init__.py +14 -0
  355. aiq/runtime/loader.py +215 -0
  356. aiq/runtime/runner.py +190 -0
  357. aiq/runtime/session.py +158 -0
  358. aiq/runtime/user_metadata.py +130 -0
  359. aiq/settings/__init__.py +0 -0
  360. aiq/settings/global_settings.py +318 -0
  361. aiq/test/.namespace +1 -0
  362. aiq/tool/__init__.py +0 -0
  363. aiq/tool/chat_completion.py +74 -0
  364. aiq/tool/code_execution/README.md +151 -0
  365. aiq/tool/code_execution/__init__.py +0 -0
  366. aiq/tool/code_execution/code_sandbox.py +267 -0
  367. aiq/tool/code_execution/local_sandbox/.gitignore +1 -0
  368. aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
  369. aiq/tool/code_execution/local_sandbox/__init__.py +13 -0
  370. aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +198 -0
  371. aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +6 -0
  372. aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +50 -0
  373. aiq/tool/code_execution/register.py +74 -0
  374. aiq/tool/code_execution/test_code_execution_sandbox.py +414 -0
  375. aiq/tool/code_execution/utils.py +100 -0
  376. aiq/tool/datetime_tools.py +42 -0
  377. aiq/tool/document_search.py +141 -0
  378. aiq/tool/github_tools/__init__.py +0 -0
  379. aiq/tool/github_tools/create_github_commit.py +133 -0
  380. aiq/tool/github_tools/create_github_issue.py +87 -0
  381. aiq/tool/github_tools/create_github_pr.py +106 -0
  382. aiq/tool/github_tools/get_github_file.py +106 -0
  383. aiq/tool/github_tools/get_github_issue.py +166 -0
  384. aiq/tool/github_tools/get_github_pr.py +256 -0
  385. aiq/tool/github_tools/update_github_issue.py +100 -0
  386. aiq/tool/mcp/__init__.py +14 -0
  387. aiq/tool/mcp/exceptions.py +142 -0
  388. aiq/tool/mcp/mcp_client.py +255 -0
  389. aiq/tool/mcp/mcp_tool.py +96 -0
  390. aiq/tool/memory_tools/__init__.py +0 -0
  391. aiq/tool/memory_tools/add_memory_tool.py +79 -0
  392. aiq/tool/memory_tools/delete_memory_tool.py +67 -0
  393. aiq/tool/memory_tools/get_memory_tool.py +72 -0
  394. aiq/tool/nvidia_rag.py +95 -0
  395. aiq/tool/register.py +38 -0
  396. aiq/tool/retriever.py +89 -0
  397. aiq/tool/server_tools.py +66 -0
  398. aiq/utils/__init__.py +0 -0
  399. aiq/utils/data_models/__init__.py +0 -0
  400. aiq/utils/data_models/schema_validator.py +58 -0
  401. aiq/utils/debugging_utils.py +43 -0
  402. aiq/utils/dump_distro_mapping.py +32 -0
  403. aiq/utils/exception_handlers/__init__.py +0 -0
  404. aiq/utils/exception_handlers/automatic_retries.py +289 -0
  405. aiq/utils/exception_handlers/mcp.py +211 -0
  406. aiq/utils/exception_handlers/schemas.py +114 -0
  407. aiq/utils/io/__init__.py +0 -0
  408. aiq/utils/io/model_processing.py +28 -0
  409. aiq/utils/io/yaml_tools.py +119 -0
  410. aiq/utils/log_utils.py +37 -0
  411. aiq/utils/metadata_utils.py +74 -0
  412. aiq/utils/optional_imports.py +142 -0
  413. aiq/utils/producer_consumer_queue.py +178 -0
  414. aiq/utils/reactive/__init__.py +0 -0
  415. aiq/utils/reactive/base/__init__.py +0 -0
  416. aiq/utils/reactive/base/observable_base.py +65 -0
  417. aiq/utils/reactive/base/observer_base.py +55 -0
  418. aiq/utils/reactive/base/subject_base.py +79 -0
  419. aiq/utils/reactive/observable.py +59 -0
  420. aiq/utils/reactive/observer.py +76 -0
  421. aiq/utils/reactive/subject.py +131 -0
  422. aiq/utils/reactive/subscription.py +49 -0
  423. aiq/utils/settings/__init__.py +0 -0
  424. aiq/utils/settings/global_settings.py +197 -0
  425. aiq/utils/string_utils.py +38 -0
  426. aiq/utils/type_converter.py +290 -0
  427. aiq/utils/type_utils.py +484 -0
  428. aiq/utils/url_utils.py +27 -0
  429. nvidia_nat-1.2.0rc5.dist-info/METADATA +363 -0
  430. nvidia_nat-1.2.0rc5.dist-info/RECORD +435 -0
  431. nvidia_nat-1.2.0rc5.dist-info/WHEEL +5 -0
  432. nvidia_nat-1.2.0rc5.dist-info/entry_points.txt +20 -0
  433. nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE-3rd-party.txt +3686 -0
  434. nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE.md +201 -0
  435. nvidia_nat-1.2.0rc5.dist-info/top_level.txt +1 -0
@@ -0,0 +1,154 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import typing
17
+
18
+ from pydantic import Field
19
+ from pydantic import model_validator
20
+
21
+ from aiq.data_models.component_ref import LLMRef
22
+ from aiq.data_models.ttc_strategy import TTCStrategyBaseConfig
23
+
24
+
class LLMBasedPlanSelectionConfig(TTCStrategyBaseConfig, name="llm_based_plan_selection"):
    """
    Configuration for the LLM-based plan selection strategy.

    Fields:
        selection_llm: Reference to (or instance of) the LLM used to pick the best plan.
            Defaults to None, but the validator below rejects a missing/None value.
        selection_template: Prompt template for the selection request. The default
            template references the placeholders {context}, {original_prompt} and
            {plans}, and asks the LLM to prefix its answer with 'SELECTED PLAN:'.
    """
    selection_llm: LLMRef | typing.Any | None = Field(
        default=None,
        description="The LLM to use for selecting the best plan. This can be an instance of an LLM client.")

    selection_template: str = Field(
        default=("You are tasked with selecting the best plan from several alternative plans."
                 " Review the following plans and their feedback carefully to select the most "
                 "comprehensive, efficient, and effective one. "
                 "The plan is for an agent system with the following objective and context:\n\n"
                 "{context}\n\n"
                 "The system is asked to achieve the following goal:\n\n"
                 "{original_prompt}\n\n"
                 "The generated plans are as follows."
                 "\n\n{plans}"
                 "\n\nBased on your analysis, which plan (numbered 1 and onwards) is the best? "
                 "Provide a thorough explanation of your choice,"
                 " referencing specific strengths from the feedback and how they outweigh any weaknesses. "
                 "Make sure you begin your choice of selected plan with the words 'SELECTED PLAN:' "
                 "followed by the plan number."),
        description="The template to use for selecting the best plan. This should guide the LLM on how to evaluate "
        "the plans and select the best one. Ensure it is clear and concise.")

    @model_validator(mode="before")
    @classmethod
    def validate_strategies(cls, values: typing.Any) -> typing.Any:
        """
        Ensure that selection_llm is provided before field validation runs.

        Args:
            values: The raw input handed to the model. Only mapping input is inspected here;
                any other input is returned untouched so that pydantic reports it through
                its normal validation path instead of failing on a missing `.get`.

        Returns:
            The unmodified input.

        Raises:
            ValueError: If the input is a dict whose 'selection_llm' entry is missing or None.
        """
        if isinstance(values, dict) and values.get('selection_llm') is None:
            raise ValueError('selection_llm must be provided when'
                             ' selection_strategy is set to LLM_BASED_PLAN_SELECTION.')

        return values
61
+
62
+
class LLMBasedAgentOutputSelectionConfig(TTCStrategyBaseConfig, name="llm_based_agent_output_selection"):
    """
    Configuration for the LLM-based agent output selection strategy.

    Fields:
        selection_llm: Reference to (or instance of) the LLM used to pick the best output.
            Defaults to None, but the validator below rejects a missing/None value.
        selection_template: Prompt template for the selection request. The default
            template references the placeholders {objective}, {input} and {results},
            and asks the LLM to prefix its answer with 'SELECTED ITEM:'.
    """
    selection_llm: LLMRef | typing.Any | None = Field(
        default=None,
        description="The LLM to use for selecting the best output. This can be an instance of an LLM client.")

    selection_template: str = Field(
        default=("You are tasked with selecting the best output from several outputs. "
                 "The outputs are from an agent system whose objective and input will be provided below.\n "
                 "Review all the outputs and select one that fits the best. You will do this by "
                 "looking at how many outputs have the same classification. Choose the one that has the most. "
                 "Of the ones that have the same classification, choose the one that is the most complete, "
                 "clear, and comprehensive. The objective of the agent is: \n"
                 "{objective}\n\n"
                 "\n\nThe agent is asked to achieve the following goal:\n\n"
                 "{input}\n\n"
                 "The generated outputs are as follows."
                 "\n\n{results}"
                 "\n\nBased on your analysis, which plan (numbered 1 and onwards) is the best? "
                 "Provide a thorough explanation of your choice,"
                 " referencing specific strengths from the feedback and how they outweigh any weaknesses. "
                 "You must ALWAYS select an option, even if the options are identical or similar. "
                 "Make sure you begin your choice of selected plan with the words 'SELECTED ITEM:' "
                 "followed by the plan number."),
        description="The template to use for selecting the best output. This should guide the LLM on how to evaluate "
        "the outputs and select the best one. Ensure it is clear and concise. Must contain {objective}, "
        "{input}, and {results} ")

    @model_validator(mode="before")
    @classmethod
    def validate_strategies(cls, values: typing.Any) -> typing.Any:
        """
        Ensure that selection_llm is provided before field validation runs.

        Args:
            values: The raw input handed to the model. Only mapping input is inspected here;
                any other input is returned untouched so that pydantic reports it through
                its normal validation path instead of failing on a missing `.get`.

        Returns:
            The unmodified input.

        Raises:
            ValueError: If the input is a dict whose 'selection_llm' entry is missing or None.
        """
        if isinstance(values, dict) and values.get('selection_llm') is None:
            raise ValueError('selection_llm must be provided when '
                             'selection_strategy is set to LLM_BASED_AGENT_OUTPUT_SELECTION.')

        return values
103
+
104
+
class LLMBasedOutputMergingConfig(TTCStrategyBaseConfig, name="llm_based_agent_output_merging"):
    """
    Configuration for the LLM-based agent output merging strategy.

    Fields:
        selection_llm: Reference to (or instance of) the LLM used to merge the outputs.
            Defaults to None, but the validator below rejects a missing/None value.
        selection_template: Prompt template for the merge request. The default template
            references the placeholders {pipeline_type}, {objective}, {input} and
            {results}, and asks the LLM to prefix its answer with 'MERGED OUTPUT:'.
    """
    selection_llm: LLMRef | typing.Any | None = Field(
        default=None,
        description="The LLM to use for merging the outputs. This can be an instance of an LLM client.")

    selection_template: str = Field(
        default=("You are tasked with merging the output of an agent system that produces {pipeline_type}. "
                 "The outputs are from an agent system whose objective and input will be provided below.\n "
                 "Review all the outputs, please combine them all into one output, keeping with the intended structure "
                 "generated by the outputs and general tone. Capture the important pieces of each of the outputs "
                 "to create comprehensive output that achieves the input and objective. "
                 "The objective of the agent is: \n"
                 "{objective}\n\n"
                 "\n\nThe agent is asked to achieve the following goal:\n\n"
                 "{input}\n\n"
                 "The generated outputs are as follows."
                 "\n\n{results}"
                 "\n\n Make sure you begin your updated output with the words 'MERGED OUTPUT:' "),
        description="The template to use for merging the outputs. This should guide the LLM on how to combine "
        "the outputs into a single one. Ensure it is clear and concise. Must contain {objective}, "
        "{input}, and {results}; the default template also references {pipeline_type}.")

    @model_validator(mode="before")
    @classmethod
    def validate_strategies(cls, values: typing.Any) -> typing.Any:
        """
        Ensure that selection_llm is provided before field validation runs.

        Args:
            values: The raw input handed to the model. Only mapping input is inspected here;
                any other input is returned untouched so that pydantic reports it through
                its normal validation path instead of failing on a missing `.get`.

        Returns:
            The unmodified input.

        Raises:
            ValueError: If the input is a dict whose 'selection_llm' entry is missing or None.
        """
        if isinstance(values, dict) and values.get('selection_llm') is None:
            # The message names this strategy (merging), not the sibling selection strategy.
            raise ValueError('selection_llm must be provided when '
                             'selection_strategy is set to LLM_BASED_AGENT_OUTPUT_MERGING.')

        return values
140
+
141
+
class ThresholdSelectionConfig(TTCStrategyBaseConfig, name="threshold_selection"):
    """
    Settings for the score-threshold selection strategy.

    The only field, `threshold`, is the score cut-off (default 5.0). Per the field
    description, items scoring at or above it are kept.
    NOTE(review): the comparison itself lives in the selector, not here; confirm
    whether it is inclusive (>=) as the description states.
    """
    threshold: float = Field(
        default=5.0,
        description="Only keep TTCItems with score >= this value.",
    )
148
+
149
+
class BestOfNSelectionConfig(TTCStrategyBaseConfig, name="best_of_n_selection"):
    """
    Settings for the Best-of-N selection strategy.

    Declares no fields of its own; everything comes from TTCStrategyBaseConfig.
    """
@@ -0,0 +1,43 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from enum import Enum
17
+
18
+
19
class PipelineTypeEnum(str, Enum):
    """
    Kinds of pipeline used in Inference Time Scaling.

    Members are also plain strings, so they compare equal to their values.
    """
    PLANNING = "planning"
    TOOL_USE = "tool_use"
    AGENT_EXECUTION = "agent_execution"
    CUSTOM = "custom"

    def __str__(self) -> str:
        # Render as the bare value (e.g. "planning") rather than "PipelineTypeEnum.PLANNING".
        return self._value_
30
+
31
+
32
class StageTypeEnum(str, Enum):
    """
    Kinds of stage that can appear in a pipeline.

    Members are also plain strings, so they compare equal to their values.
    """
    SEARCH = "search"
    EDITING = "editing"
    SCORING = "scoring"
    SELECTION = "selection"
    CUSTOM = "custom"

    def __str__(self) -> str:
        # Render as the bare value (e.g. "scoring") rather than "StageTypeEnum.SCORING".
        return self._value_
@@ -0,0 +1,66 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from abc import ABC
17
+ from abc import abstractmethod
18
+
19
+ from aiq.builder.builder import Builder
20
+ from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
21
+ from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum, PipelineTypeEnum
22
+ from aiq.data_models.ttc_strategy import TTCStrategyBaseConfig
23
+
24
+
25
class StrategyBase(ABC):
    """
    Abstract base class for strategy implementations.

    This class defines the interface for strategies that can be used in the
    TTC framework. Concrete strategy classes should implement the abstract
    methods defined here.
    """

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        """Store the strategy configuration; the pipeline type starts unset."""
        self.config: TTCStrategyBaseConfig = config
        # Stays None until set_pipeline_type() accepts a supported pipeline type.
        self.pipeline_type: PipelineTypeEnum | None = None

    @abstractmethod
    async def build_components(self, builder: Builder) -> None:
        """Build the components required for the strategy."""

    @abstractmethod
    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Run the strategy over ``items``.

        Args:
            items: The items to process.
            original_prompt: Optional prompt associated with the items.
            agent_context: Optional context associated with the items.
            **kwargs: Extra, strategy-specific arguments.

        Returns:
            The list of items produced by the strategy.
        """

    @abstractmethod
    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types supported by this strategy."""

    @abstractmethod
    def stage_type(self) -> StageTypeEnum:
        """Return the stage type of this strategy."""

    def set_pipeline_type(self, pipeline_type: PipelineTypeEnum) -> None:
        """
        Set the pipeline type for this strategy.

        Raises:
            ValueError: If ``pipeline_type`` is not in ``supported_pipeline_types()``.
        """
        if pipeline_type not in self.supported_pipeline_types():
            raise ValueError(f"Pipeline type {pipeline_type} is not supported by this strategy.")
        self.pipeline_type = pipeline_type
@@ -0,0 +1,41 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from pydantic import BaseModel
17
+ from pydantic import Field
18
+
19
+
20
class ToolUseInputSchema(BaseModel):
    """
    Describes one requested tool invocation: which tool, for what task, and optionally
    why it was chosen and what it produced.
    """
    # Required fields.
    tool_name: str = Field(description="The name of the tool to use. Must be registered in the system.")
    task_description: str = Field(description="The description of the task to perform with the tool.")

    # Optional fields; both default to None.
    motivation: str | None = Field(
        description="An optional motivation for the tool use, providing additional context or reasoning.",
        default=None,
    )
    output: str | None = Field(
        description="The output of the tool use. This can be used to store the result of the tool execution.",
        default=None,
    )
34
+
35
+
36
class ToolUselist(BaseModel):
    """
    Container model wrapping a list of ``ToolUseInputSchema`` entries.
    """
    # Required: the tool-use requests, one entry per tool invocation.
    tools: list[ToolUseInputSchema] = Field(
        description="A list of tool use inputs, each containing the tool name and task description.")
@@ -0,0 +1,48 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import typing
17
+
18
+ from pydantic import BaseModel
19
+ from pydantic import ConfigDict
20
+ from pydantic import Field
21
+
22
+
23
class TTCItem(BaseModel):
    """
    A single unit of work passed between TTC functions and pipelines.

    Every field is optional and defaults to None; unknown extra fields are accepted.
    """
    # Accept attributes beyond the ones declared below.
    model_config = ConfigDict(extra="allow")

    input: typing.Any | None = Field(
        default=None,
        description="Input to the function or pipeline. This can be a structured tool call, or other info.",
    )
    output: typing.Any | None = Field(
        default=None,
        description="Output from the function or pipeline. This can be a structured tool call, or other info.",
    )
    plan: typing.Any | None = Field(
        default=None,
        description="Search plan for downstream agent(s).",
    )
    feedback: str | None = Field(
        default=None,
        description="Feedback provided by feedback steps to improve the plan.",
    )
    score: float | None = Field(
        default=None,
        description=("Score of the plan based on feedback or other evaluation criteria. "
                     "This can be used to rank plans."),
    )
    metadata: typing.Any | None = Field(
        default=None,
        description="Additional information. This can be a structured tool call, or other info not in the plan.",
    )
    name: str | None = Field(
        default=None,
        description="Name of the item or function, used for identification in pipelines.",
    )
@@ -0,0 +1,36 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ # pylint: disable=unused-import
17
+ # flake8: noqa
18
+
19
+ from .editing import iterative_plan_refinement_editor
20
+ from .editing import llm_as_a_judge_editor
21
+ from .editing import motivation_aware_summarization
22
+ from .functions import execute_score_select_function
23
+ from .functions import its_tool_orchestration_function
24
+ from .functions import its_tool_wrapper_function
25
+ from .functions import plan_select_execute_function
26
+ from .scoring import llm_based_agent_scorer
27
+ from .scoring import llm_based_plan_scorer
28
+ from .scoring import motivation_aware_scorer
29
+ from .search import multi_llm_planner
30
+ from .search import multi_query_retrieval_search
31
+ from .search import single_shot_multi_plan_planner
32
+ from .selection import best_of_n_selector
33
+ from .selection import llm_based_agent_output_selector
34
+ from .selection import llm_based_output_merging_selector
35
+ from .selection import llm_based_plan_selector
36
+ from .selection import threshold_selector
File without changes
@@ -0,0 +1,168 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import asyncio
17
+ import logging
18
+ import re
19
+
20
+ from aiq.builder.builder import Builder
21
+ from aiq.builder.framework_enum import LLMFrameworkEnum
22
+ from aiq.cli.register_workflow import register_ttc_strategy
23
+ from aiq.data_models.ttc_strategy import TTCStrategyBaseConfig
24
+ from aiq.experimental.test_time_compute.models.scoring_config import LLMBasedAgentScoringConfig
25
+ from aiq.experimental.test_time_compute.models.stage_enums import PipelineTypeEnum
26
+ from aiq.experimental.test_time_compute.models.stage_enums import StageTypeEnum
27
+ from aiq.experimental.test_time_compute.models.strategy_base import StrategyBase
28
+ from aiq.experimental.test_time_compute.models.ttc_item import TTCItem
29
+ from aiq.utils.io.model_processing import remove_r1_think_tags
30
+
31
+ logger = logging.getLogger(__name__)
32
+
33
+
34
class LLMBasedAgentScorer(StrategyBase):
    """
    Scoring strategy that asks an LLM to grade each item's output.

    The LLM is prompted with ``config.scoring_template`` and is expected to answer
    with a line of the form ``FINAL SCORE: <number>``.
    """

    # Captures a plain decimal number after "FINAL SCORE:". The pattern deliberately stops
    # at the end of the number, so a sentence-ending period ("FINAL SCORE: 7.5.") or other
    # trailing dots are not swallowed into the capture and cannot break float().
    _SCORE_PATTERN = re.compile(r'FINAL SCORE:\s*(\d+(?:\.\d+)?|\.\d+)')

    def __init__(self, config: TTCStrategyBaseConfig) -> None:
        super().__init__(config)
        # Populated by build_components().
        self.llm_bound = None

    async def build_components(self, builder: Builder) -> None:
        """
        Build the components required for the scorer.

        Fetches ``config.scoring_llm`` from the builder with the LangChain wrapper type
        and stores it on ``self.llm_bound``.
        """
        self.llm_bound = await builder.get_llm(self.config.scoring_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types supported by this scorer (agent execution only)."""
        return [PipelineTypeEnum.AGENT_EXECUTION]

    def stage_type(self) -> StageTypeEnum:
        """Return the stage type of this strategy (scoring)."""
        return StageTypeEnum.SCORING

    @classmethod
    def _parse_score(cls, response: str) -> float:
        """Extract the number following ``FINAL SCORE:``; log a warning and return 0.0 when absent."""
        response = response.strip()
        match = cls._SCORE_PATTERN.search(response)
        if match is None:
            logger.warning("Could not parse the score from the response: %s.", response)
            return 0.0
        # The pattern only captures text that float() accepts.
        return float(match.group(1))

    async def score_single(self, original_prompt: str | None, agent_context: str | None, item: TTCItem) -> float:
        """
        Score a single item using the LLM.

        Args:
            original_prompt (str | None): Fills the ``input`` template variable. When empty or
                None, ``str(item.input)`` is used instead.
            agent_context (str | None): Fills the ``objective`` template variable.
            item (TTCItem): The item to score; ``str(item.output)`` fills the ``output`` variable.

        Returns:
            float: The parsed score, or 0.0 when the response contains no
            ``FINAL SCORE: <number>``.

        Raises:
            ImportError: If langchain-core cannot be imported.
            ValueError: If ``self.llm_bound`` is not a ``BaseChatModel`` or the LLM
                response is not a string.
        """

        try:
            from langchain_core.language_models import BaseChatModel
            from langchain_core.prompts import PromptTemplate
        except ImportError as exc:
            raise ImportError("langchain-core is not installed. Please install it to use LLMBasedAgentScorer.\n"
                              "This error can be resolved by installing aiqtoolkit-langchain.") from exc

        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("The `scoring_llm` must be an instance of `BaseChatModel`.")

        model: BaseChatModel = self.llm_bound

        prompt_template = PromptTemplate(
            template=self.config.scoring_template,
            input_variables=["objective", "input", "output"],
            validate_template=True,
        )

        prompt = await prompt_template.ainvoke(
            input={
                "objective": agent_context,
                "input": original_prompt or str(item.input),
                "output": str(item.output),
            })

        response = (await model.ainvoke(prompt)).content
        response = remove_r1_think_tags(response)

        # The score is expected in the format `FINAL SCORE: <float>` in the LLM response.
        if not isinstance(response, str):
            logger.warning("Invalid response from LLM for scoring: %s.", response)
            raise ValueError("Unable to parse the score from the LLM response.")

        return self._parse_score(response)

    async def ainvoke(self,
                      items: list[TTCItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[TTCItem]:
        """
        Score a list of items concurrently and record each score on its item.

        Args:
            items (list[TTCItem]): The items to score.
            original_prompt (str | None): The original prompt.
            agent_context (str | None): The agent context.

        Returns:
            list[TTCItem]: The same items, each with its ``score`` attribute set.
            An empty input yields an empty list.
        """
        if not items:
            return []

        # Score every item concurrently; gather returns results in input order.
        scores = await asyncio.gather(
            *(self.score_single(original_prompt=original_prompt, agent_context=agent_context, item=item)
              for item in items))

        logger.debug("Scores for planning items: %s", scores)

        # strict=True raises ValueError if the number of scores ever differs from the number of items.
        for item, score in zip(items, scores, strict=True):
            item.score = score

        return items
152
+
153
+
154
@register_ttc_strategy(config_type=LLMBasedAgentScoringConfig)
async def register_llm_based_agent_scorer(config: LLMBasedAgentScoringConfig, builder: Builder):
    """
    Create an ``LLMBasedAgentScorer`` for ``config``, build its components, and yield it.

    Args:
        config (LLMBasedAgentScoringConfig): Configuration passed to the scorer.
        builder (Builder): Builder handed to the scorer's ``build_components``.

    Yields:
        LLMBasedAgentScorer: The scorer, after ``build_components`` has completed.
    """
    strategy = LLMBasedAgentScorer(config)
    await strategy.build_components(builder)
    yield strategy