aiqtoolkit 1.2.0rc4__py3-none-any.whl → 1.2rc9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of aiqtoolkit might be problematic. Click here for more details.

Files changed (441)
  1. aiqtoolkit-1.2rc9.dist-info/METADATA +29 -0
  2. aiqtoolkit-1.2rc9.dist-info/RECORD +4 -0
  3. aiqtoolkit-1.2rc9.dist-info/top_level.txt +1 -0
  4. aiq/agent/__init__.py +0 -0
  5. aiq/agent/base.py +0 -239
  6. aiq/agent/dual_node.py +0 -67
  7. aiq/agent/react_agent/__init__.py +0 -0
  8. aiq/agent/react_agent/agent.py +0 -355
  9. aiq/agent/react_agent/output_parser.py +0 -104
  10. aiq/agent/react_agent/prompt.py +0 -41
  11. aiq/agent/react_agent/register.py +0 -149
  12. aiq/agent/reasoning_agent/__init__.py +0 -0
  13. aiq/agent/reasoning_agent/reasoning_agent.py +0 -225
  14. aiq/agent/register.py +0 -23
  15. aiq/agent/rewoo_agent/__init__.py +0 -0
  16. aiq/agent/rewoo_agent/agent.py +0 -411
  17. aiq/agent/rewoo_agent/prompt.py +0 -108
  18. aiq/agent/rewoo_agent/register.py +0 -158
  19. aiq/agent/tool_calling_agent/__init__.py +0 -0
  20. aiq/agent/tool_calling_agent/agent.py +0 -119
  21. aiq/agent/tool_calling_agent/register.py +0 -106
  22. aiq/authentication/__init__.py +0 -14
  23. aiq/authentication/api_key/__init__.py +0 -14
  24. aiq/authentication/api_key/api_key_auth_provider.py +0 -96
  25. aiq/authentication/api_key/api_key_auth_provider_config.py +0 -124
  26. aiq/authentication/api_key/register.py +0 -26
  27. aiq/authentication/exceptions/__init__.py +0 -14
  28. aiq/authentication/exceptions/api_key_exceptions.py +0 -38
  29. aiq/authentication/exceptions/auth_code_grant_exceptions.py +0 -86
  30. aiq/authentication/exceptions/call_back_exceptions.py +0 -38
  31. aiq/authentication/exceptions/request_exceptions.py +0 -54
  32. aiq/authentication/http_basic_auth/__init__.py +0 -0
  33. aiq/authentication/http_basic_auth/http_basic_auth_provider.py +0 -81
  34. aiq/authentication/http_basic_auth/register.py +0 -30
  35. aiq/authentication/interfaces.py +0 -93
  36. aiq/authentication/oauth2/__init__.py +0 -14
  37. aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +0 -107
  38. aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +0 -39
  39. aiq/authentication/oauth2/register.py +0 -25
  40. aiq/authentication/register.py +0 -21
  41. aiq/builder/__init__.py +0 -0
  42. aiq/builder/builder.py +0 -285
  43. aiq/builder/component_utils.py +0 -316
  44. aiq/builder/context.py +0 -264
  45. aiq/builder/embedder.py +0 -24
  46. aiq/builder/eval_builder.py +0 -161
  47. aiq/builder/evaluator.py +0 -29
  48. aiq/builder/framework_enum.py +0 -24
  49. aiq/builder/front_end.py +0 -73
  50. aiq/builder/function.py +0 -344
  51. aiq/builder/function_base.py +0 -380
  52. aiq/builder/function_info.py +0 -627
  53. aiq/builder/intermediate_step_manager.py +0 -174
  54. aiq/builder/llm.py +0 -25
  55. aiq/builder/retriever.py +0 -25
  56. aiq/builder/user_interaction_manager.py +0 -74
  57. aiq/builder/workflow.py +0 -148
  58. aiq/builder/workflow_builder.py +0 -1117
  59. aiq/cli/__init__.py +0 -14
  60. aiq/cli/cli_utils/__init__.py +0 -0
  61. aiq/cli/cli_utils/config_override.py +0 -231
  62. aiq/cli/cli_utils/validation.py +0 -37
  63. aiq/cli/commands/__init__.py +0 -0
  64. aiq/cli/commands/configure/__init__.py +0 -0
  65. aiq/cli/commands/configure/channel/__init__.py +0 -0
  66. aiq/cli/commands/configure/channel/add.py +0 -28
  67. aiq/cli/commands/configure/channel/channel.py +0 -36
  68. aiq/cli/commands/configure/channel/remove.py +0 -30
  69. aiq/cli/commands/configure/channel/update.py +0 -30
  70. aiq/cli/commands/configure/configure.py +0 -33
  71. aiq/cli/commands/evaluate.py +0 -139
  72. aiq/cli/commands/info/__init__.py +0 -14
  73. aiq/cli/commands/info/info.py +0 -39
  74. aiq/cli/commands/info/list_channels.py +0 -32
  75. aiq/cli/commands/info/list_components.py +0 -129
  76. aiq/cli/commands/info/list_mcp.py +0 -213
  77. aiq/cli/commands/registry/__init__.py +0 -14
  78. aiq/cli/commands/registry/publish.py +0 -88
  79. aiq/cli/commands/registry/pull.py +0 -118
  80. aiq/cli/commands/registry/registry.py +0 -38
  81. aiq/cli/commands/registry/remove.py +0 -108
  82. aiq/cli/commands/registry/search.py +0 -155
  83. aiq/cli/commands/sizing/__init__.py +0 -14
  84. aiq/cli/commands/sizing/calc.py +0 -297
  85. aiq/cli/commands/sizing/sizing.py +0 -27
  86. aiq/cli/commands/start.py +0 -246
  87. aiq/cli/commands/uninstall.py +0 -81
  88. aiq/cli/commands/validate.py +0 -47
  89. aiq/cli/commands/workflow/__init__.py +0 -14
  90. aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
  91. aiq/cli/commands/workflow/templates/config.yml.j2 +0 -16
  92. aiq/cli/commands/workflow/templates/pyproject.toml.j2 +0 -22
  93. aiq/cli/commands/workflow/templates/register.py.j2 +0 -5
  94. aiq/cli/commands/workflow/templates/workflow.py.j2 +0 -36
  95. aiq/cli/commands/workflow/workflow.py +0 -37
  96. aiq/cli/commands/workflow/workflow_commands.py +0 -313
  97. aiq/cli/entrypoint.py +0 -135
  98. aiq/cli/main.py +0 -44
  99. aiq/cli/register_workflow.py +0 -488
  100. aiq/cli/type_registry.py +0 -1000
  101. aiq/data_models/__init__.py +0 -14
  102. aiq/data_models/api_server.py +0 -694
  103. aiq/data_models/authentication.py +0 -231
  104. aiq/data_models/common.py +0 -171
  105. aiq/data_models/component.py +0 -54
  106. aiq/data_models/component_ref.py +0 -168
  107. aiq/data_models/config.py +0 -406
  108. aiq/data_models/dataset_handler.py +0 -123
  109. aiq/data_models/discovery_metadata.py +0 -335
  110. aiq/data_models/embedder.py +0 -27
  111. aiq/data_models/evaluate.py +0 -127
  112. aiq/data_models/evaluator.py +0 -26
  113. aiq/data_models/front_end.py +0 -26
  114. aiq/data_models/function.py +0 -30
  115. aiq/data_models/function_dependencies.py +0 -72
  116. aiq/data_models/interactive.py +0 -246
  117. aiq/data_models/intermediate_step.py +0 -302
  118. aiq/data_models/invocation_node.py +0 -38
  119. aiq/data_models/its_strategy.py +0 -30
  120. aiq/data_models/llm.py +0 -27
  121. aiq/data_models/logging.py +0 -26
  122. aiq/data_models/memory.py +0 -27
  123. aiq/data_models/object_store.py +0 -44
  124. aiq/data_models/profiler.py +0 -54
  125. aiq/data_models/registry_handler.py +0 -26
  126. aiq/data_models/retriever.py +0 -30
  127. aiq/data_models/retry_mixin.py +0 -35
  128. aiq/data_models/span.py +0 -187
  129. aiq/data_models/step_adaptor.py +0 -64
  130. aiq/data_models/streaming.py +0 -33
  131. aiq/data_models/swe_bench_model.py +0 -54
  132. aiq/data_models/telemetry_exporter.py +0 -26
  133. aiq/embedder/__init__.py +0 -0
  134. aiq/embedder/langchain_client.py +0 -41
  135. aiq/embedder/nim_embedder.py +0 -59
  136. aiq/embedder/openai_embedder.py +0 -43
  137. aiq/embedder/register.py +0 -24
  138. aiq/eval/__init__.py +0 -14
  139. aiq/eval/config.py +0 -60
  140. aiq/eval/dataset_handler/__init__.py +0 -0
  141. aiq/eval/dataset_handler/dataset_downloader.py +0 -106
  142. aiq/eval/dataset_handler/dataset_filter.py +0 -52
  143. aiq/eval/dataset_handler/dataset_handler.py +0 -254
  144. aiq/eval/evaluate.py +0 -506
  145. aiq/eval/evaluator/__init__.py +0 -14
  146. aiq/eval/evaluator/base_evaluator.py +0 -73
  147. aiq/eval/evaluator/evaluator_model.py +0 -45
  148. aiq/eval/intermediate_step_adapter.py +0 -99
  149. aiq/eval/rag_evaluator/__init__.py +0 -0
  150. aiq/eval/rag_evaluator/evaluate.py +0 -178
  151. aiq/eval/rag_evaluator/register.py +0 -143
  152. aiq/eval/register.py +0 -23
  153. aiq/eval/remote_workflow.py +0 -133
  154. aiq/eval/runners/__init__.py +0 -14
  155. aiq/eval/runners/config.py +0 -39
  156. aiq/eval/runners/multi_eval_runner.py +0 -54
  157. aiq/eval/runtime_event_subscriber.py +0 -52
  158. aiq/eval/swe_bench_evaluator/__init__.py +0 -0
  159. aiq/eval/swe_bench_evaluator/evaluate.py +0 -215
  160. aiq/eval/swe_bench_evaluator/register.py +0 -36
  161. aiq/eval/trajectory_evaluator/__init__.py +0 -0
  162. aiq/eval/trajectory_evaluator/evaluate.py +0 -75
  163. aiq/eval/trajectory_evaluator/register.py +0 -40
  164. aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
  165. aiq/eval/tunable_rag_evaluator/evaluate.py +0 -245
  166. aiq/eval/tunable_rag_evaluator/register.py +0 -52
  167. aiq/eval/usage_stats.py +0 -41
  168. aiq/eval/utils/__init__.py +0 -0
  169. aiq/eval/utils/output_uploader.py +0 -140
  170. aiq/eval/utils/tqdm_position_registry.py +0 -40
  171. aiq/eval/utils/weave_eval.py +0 -184
  172. aiq/experimental/__init__.py +0 -0
  173. aiq/experimental/decorators/__init__.py +0 -0
  174. aiq/experimental/decorators/experimental_warning_decorator.py +0 -130
  175. aiq/experimental/inference_time_scaling/__init__.py +0 -0
  176. aiq/experimental/inference_time_scaling/editing/__init__.py +0 -0
  177. aiq/experimental/inference_time_scaling/editing/iterative_plan_refinement_editor.py +0 -147
  178. aiq/experimental/inference_time_scaling/editing/llm_as_a_judge_editor.py +0 -204
  179. aiq/experimental/inference_time_scaling/editing/motivation_aware_summarization.py +0 -107
  180. aiq/experimental/inference_time_scaling/functions/__init__.py +0 -0
  181. aiq/experimental/inference_time_scaling/functions/execute_score_select_function.py +0 -105
  182. aiq/experimental/inference_time_scaling/functions/its_tool_orchestration_function.py +0 -205
  183. aiq/experimental/inference_time_scaling/functions/its_tool_wrapper_function.py +0 -146
  184. aiq/experimental/inference_time_scaling/functions/plan_select_execute_function.py +0 -224
  185. aiq/experimental/inference_time_scaling/models/__init__.py +0 -0
  186. aiq/experimental/inference_time_scaling/models/editor_config.py +0 -132
  187. aiq/experimental/inference_time_scaling/models/its_item.py +0 -48
  188. aiq/experimental/inference_time_scaling/models/scoring_config.py +0 -112
  189. aiq/experimental/inference_time_scaling/models/search_config.py +0 -120
  190. aiq/experimental/inference_time_scaling/models/selection_config.py +0 -154
  191. aiq/experimental/inference_time_scaling/models/stage_enums.py +0 -43
  192. aiq/experimental/inference_time_scaling/models/strategy_base.py +0 -66
  193. aiq/experimental/inference_time_scaling/models/tool_use_config.py +0 -41
  194. aiq/experimental/inference_time_scaling/register.py +0 -36
  195. aiq/experimental/inference_time_scaling/scoring/__init__.py +0 -0
  196. aiq/experimental/inference_time_scaling/scoring/llm_based_agent_scorer.py +0 -168
  197. aiq/experimental/inference_time_scaling/scoring/llm_based_plan_scorer.py +0 -168
  198. aiq/experimental/inference_time_scaling/scoring/motivation_aware_scorer.py +0 -111
  199. aiq/experimental/inference_time_scaling/search/__init__.py +0 -0
  200. aiq/experimental/inference_time_scaling/search/multi_llm_planner.py +0 -128
  201. aiq/experimental/inference_time_scaling/search/multi_query_retrieval_search.py +0 -122
  202. aiq/experimental/inference_time_scaling/search/single_shot_multi_plan_planner.py +0 -128
  203. aiq/experimental/inference_time_scaling/selection/__init__.py +0 -0
  204. aiq/experimental/inference_time_scaling/selection/best_of_n_selector.py +0 -63
  205. aiq/experimental/inference_time_scaling/selection/llm_based_agent_output_selector.py +0 -131
  206. aiq/experimental/inference_time_scaling/selection/llm_based_output_merging_selector.py +0 -159
  207. aiq/experimental/inference_time_scaling/selection/llm_based_plan_selector.py +0 -128
  208. aiq/experimental/inference_time_scaling/selection/threshold_selector.py +0 -58
  209. aiq/front_ends/__init__.py +0 -14
  210. aiq/front_ends/console/__init__.py +0 -14
  211. aiq/front_ends/console/authentication_flow_handler.py +0 -233
  212. aiq/front_ends/console/console_front_end_config.py +0 -32
  213. aiq/front_ends/console/console_front_end_plugin.py +0 -96
  214. aiq/front_ends/console/register.py +0 -25
  215. aiq/front_ends/cron/__init__.py +0 -14
  216. aiq/front_ends/fastapi/__init__.py +0 -14
  217. aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
  218. aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +0 -27
  219. aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +0 -107
  220. aiq/front_ends/fastapi/fastapi_front_end_config.py +0 -234
  221. aiq/front_ends/fastapi/fastapi_front_end_controller.py +0 -68
  222. aiq/front_ends/fastapi/fastapi_front_end_plugin.py +0 -116
  223. aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +0 -1092
  224. aiq/front_ends/fastapi/html_snippets/__init__.py +0 -14
  225. aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +0 -35
  226. aiq/front_ends/fastapi/intermediate_steps_subscriber.py +0 -80
  227. aiq/front_ends/fastapi/job_store.py +0 -183
  228. aiq/front_ends/fastapi/main.py +0 -72
  229. aiq/front_ends/fastapi/message_handler.py +0 -298
  230. aiq/front_ends/fastapi/message_validator.py +0 -345
  231. aiq/front_ends/fastapi/register.py +0 -25
  232. aiq/front_ends/fastapi/response_helpers.py +0 -195
  233. aiq/front_ends/fastapi/step_adaptor.py +0 -321
  234. aiq/front_ends/mcp/__init__.py +0 -14
  235. aiq/front_ends/mcp/mcp_front_end_config.py +0 -32
  236. aiq/front_ends/mcp/mcp_front_end_plugin.py +0 -93
  237. aiq/front_ends/mcp/register.py +0 -27
  238. aiq/front_ends/mcp/tool_converter.py +0 -242
  239. aiq/front_ends/register.py +0 -22
  240. aiq/front_ends/simple_base/__init__.py +0 -14
  241. aiq/front_ends/simple_base/simple_front_end_plugin_base.py +0 -54
  242. aiq/llm/__init__.py +0 -0
  243. aiq/llm/aws_bedrock_llm.py +0 -57
  244. aiq/llm/nim_llm.py +0 -46
  245. aiq/llm/openai_llm.py +0 -46
  246. aiq/llm/register.py +0 -23
  247. aiq/llm/utils/__init__.py +0 -14
  248. aiq/llm/utils/env_config_value.py +0 -94
  249. aiq/llm/utils/error.py +0 -17
  250. aiq/memory/__init__.py +0 -20
  251. aiq/memory/interfaces.py +0 -183
  252. aiq/memory/models.py +0 -112
  253. aiq/meta/module_to_distro.json +0 -3
  254. aiq/meta/pypi.md +0 -58
  255. aiq/object_store/__init__.py +0 -20
  256. aiq/object_store/in_memory_object_store.py +0 -76
  257. aiq/object_store/interfaces.py +0 -84
  258. aiq/object_store/models.py +0 -36
  259. aiq/object_store/register.py +0 -20
  260. aiq/observability/__init__.py +0 -14
  261. aiq/observability/exporter/__init__.py +0 -14
  262. aiq/observability/exporter/base_exporter.py +0 -449
  263. aiq/observability/exporter/exporter.py +0 -78
  264. aiq/observability/exporter/file_exporter.py +0 -33
  265. aiq/observability/exporter/processing_exporter.py +0 -322
  266. aiq/observability/exporter/raw_exporter.py +0 -52
  267. aiq/observability/exporter/span_exporter.py +0 -265
  268. aiq/observability/exporter_manager.py +0 -335
  269. aiq/observability/mixin/__init__.py +0 -14
  270. aiq/observability/mixin/batch_config_mixin.py +0 -26
  271. aiq/observability/mixin/collector_config_mixin.py +0 -23
  272. aiq/observability/mixin/file_mixin.py +0 -288
  273. aiq/observability/mixin/file_mode.py +0 -23
  274. aiq/observability/mixin/resource_conflict_mixin.py +0 -134
  275. aiq/observability/mixin/serialize_mixin.py +0 -61
  276. aiq/observability/mixin/type_introspection_mixin.py +0 -183
  277. aiq/observability/processor/__init__.py +0 -14
  278. aiq/observability/processor/batching_processor.py +0 -309
  279. aiq/observability/processor/callback_processor.py +0 -42
  280. aiq/observability/processor/intermediate_step_serializer.py +0 -28
  281. aiq/observability/processor/processor.py +0 -71
  282. aiq/observability/register.py +0 -96
  283. aiq/observability/utils/__init__.py +0 -14
  284. aiq/observability/utils/dict_utils.py +0 -236
  285. aiq/observability/utils/time_utils.py +0 -31
  286. aiq/plugins/.namespace +0 -1
  287. aiq/profiler/__init__.py +0 -0
  288. aiq/profiler/calc/__init__.py +0 -14
  289. aiq/profiler/calc/calc_runner.py +0 -627
  290. aiq/profiler/calc/calculations.py +0 -288
  291. aiq/profiler/calc/data_models.py +0 -188
  292. aiq/profiler/calc/plot.py +0 -345
  293. aiq/profiler/callbacks/__init__.py +0 -0
  294. aiq/profiler/callbacks/agno_callback_handler.py +0 -295
  295. aiq/profiler/callbacks/base_callback_class.py +0 -20
  296. aiq/profiler/callbacks/langchain_callback_handler.py +0 -290
  297. aiq/profiler/callbacks/llama_index_callback_handler.py +0 -205
  298. aiq/profiler/callbacks/semantic_kernel_callback_handler.py +0 -238
  299. aiq/profiler/callbacks/token_usage_base_model.py +0 -27
  300. aiq/profiler/data_frame_row.py +0 -51
  301. aiq/profiler/data_models.py +0 -24
  302. aiq/profiler/decorators/__init__.py +0 -0
  303. aiq/profiler/decorators/framework_wrapper.py +0 -131
  304. aiq/profiler/decorators/function_tracking.py +0 -254
  305. aiq/profiler/forecasting/__init__.py +0 -0
  306. aiq/profiler/forecasting/config.py +0 -18
  307. aiq/profiler/forecasting/model_trainer.py +0 -75
  308. aiq/profiler/forecasting/models/__init__.py +0 -22
  309. aiq/profiler/forecasting/models/forecasting_base_model.py +0 -40
  310. aiq/profiler/forecasting/models/linear_model.py +0 -196
  311. aiq/profiler/forecasting/models/random_forest_regressor.py +0 -268
  312. aiq/profiler/inference_metrics_model.py +0 -28
  313. aiq/profiler/inference_optimization/__init__.py +0 -0
  314. aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
  315. aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +0 -460
  316. aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +0 -258
  317. aiq/profiler/inference_optimization/data_models.py +0 -386
  318. aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
  319. aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +0 -468
  320. aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +0 -405
  321. aiq/profiler/inference_optimization/llm_metrics.py +0 -212
  322. aiq/profiler/inference_optimization/prompt_caching.py +0 -163
  323. aiq/profiler/inference_optimization/token_uniqueness.py +0 -107
  324. aiq/profiler/inference_optimization/workflow_runtimes.py +0 -72
  325. aiq/profiler/intermediate_property_adapter.py +0 -102
  326. aiq/profiler/profile_runner.py +0 -473
  327. aiq/profiler/utils.py +0 -184
  328. aiq/registry_handlers/__init__.py +0 -0
  329. aiq/registry_handlers/local/__init__.py +0 -0
  330. aiq/registry_handlers/local/local_handler.py +0 -176
  331. aiq/registry_handlers/local/register_local.py +0 -37
  332. aiq/registry_handlers/metadata_factory.py +0 -60
  333. aiq/registry_handlers/package_utils.py +0 -567
  334. aiq/registry_handlers/pypi/__init__.py +0 -0
  335. aiq/registry_handlers/pypi/pypi_handler.py +0 -251
  336. aiq/registry_handlers/pypi/register_pypi.py +0 -40
  337. aiq/registry_handlers/register.py +0 -21
  338. aiq/registry_handlers/registry_handler_base.py +0 -157
  339. aiq/registry_handlers/rest/__init__.py +0 -0
  340. aiq/registry_handlers/rest/register_rest.py +0 -56
  341. aiq/registry_handlers/rest/rest_handler.py +0 -237
  342. aiq/registry_handlers/schemas/__init__.py +0 -0
  343. aiq/registry_handlers/schemas/headers.py +0 -42
  344. aiq/registry_handlers/schemas/package.py +0 -68
  345. aiq/registry_handlers/schemas/publish.py +0 -63
  346. aiq/registry_handlers/schemas/pull.py +0 -82
  347. aiq/registry_handlers/schemas/remove.py +0 -36
  348. aiq/registry_handlers/schemas/search.py +0 -91
  349. aiq/registry_handlers/schemas/status.py +0 -47
  350. aiq/retriever/__init__.py +0 -0
  351. aiq/retriever/interface.py +0 -37
  352. aiq/retriever/milvus/__init__.py +0 -14
  353. aiq/retriever/milvus/register.py +0 -81
  354. aiq/retriever/milvus/retriever.py +0 -228
  355. aiq/retriever/models.py +0 -74
  356. aiq/retriever/nemo_retriever/__init__.py +0 -14
  357. aiq/retriever/nemo_retriever/register.py +0 -60
  358. aiq/retriever/nemo_retriever/retriever.py +0 -190
  359. aiq/retriever/register.py +0 -22
  360. aiq/runtime/__init__.py +0 -14
  361. aiq/runtime/loader.py +0 -215
  362. aiq/runtime/runner.py +0 -190
  363. aiq/runtime/session.py +0 -158
  364. aiq/runtime/user_metadata.py +0 -130
  365. aiq/settings/__init__.py +0 -0
  366. aiq/settings/global_settings.py +0 -318
  367. aiq/test/.namespace +0 -1
  368. aiq/tool/__init__.py +0 -0
  369. aiq/tool/chat_completion.py +0 -74
  370. aiq/tool/code_execution/README.md +0 -151
  371. aiq/tool/code_execution/__init__.py +0 -0
  372. aiq/tool/code_execution/code_sandbox.py +0 -267
  373. aiq/tool/code_execution/local_sandbox/.gitignore +0 -1
  374. aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +0 -60
  375. aiq/tool/code_execution/local_sandbox/__init__.py +0 -13
  376. aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +0 -198
  377. aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +0 -6
  378. aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +0 -50
  379. aiq/tool/code_execution/register.py +0 -74
  380. aiq/tool/code_execution/test_code_execution_sandbox.py +0 -414
  381. aiq/tool/code_execution/utils.py +0 -100
  382. aiq/tool/datetime_tools.py +0 -42
  383. aiq/tool/document_search.py +0 -141
  384. aiq/tool/github_tools/__init__.py +0 -0
  385. aiq/tool/github_tools/create_github_commit.py +0 -133
  386. aiq/tool/github_tools/create_github_issue.py +0 -87
  387. aiq/tool/github_tools/create_github_pr.py +0 -106
  388. aiq/tool/github_tools/get_github_file.py +0 -106
  389. aiq/tool/github_tools/get_github_issue.py +0 -166
  390. aiq/tool/github_tools/get_github_pr.py +0 -256
  391. aiq/tool/github_tools/update_github_issue.py +0 -100
  392. aiq/tool/mcp/__init__.py +0 -14
  393. aiq/tool/mcp/exceptions.py +0 -142
  394. aiq/tool/mcp/mcp_client.py +0 -255
  395. aiq/tool/mcp/mcp_tool.py +0 -96
  396. aiq/tool/memory_tools/__init__.py +0 -0
  397. aiq/tool/memory_tools/add_memory_tool.py +0 -79
  398. aiq/tool/memory_tools/delete_memory_tool.py +0 -67
  399. aiq/tool/memory_tools/get_memory_tool.py +0 -72
  400. aiq/tool/nvidia_rag.py +0 -95
  401. aiq/tool/register.py +0 -38
  402. aiq/tool/retriever.py +0 -89
  403. aiq/tool/server_tools.py +0 -66
  404. aiq/utils/__init__.py +0 -0
  405. aiq/utils/data_models/__init__.py +0 -0
  406. aiq/utils/data_models/schema_validator.py +0 -58
  407. aiq/utils/debugging_utils.py +0 -43
  408. aiq/utils/dump_distro_mapping.py +0 -32
  409. aiq/utils/exception_handlers/__init__.py +0 -0
  410. aiq/utils/exception_handlers/automatic_retries.py +0 -289
  411. aiq/utils/exception_handlers/mcp.py +0 -211
  412. aiq/utils/exception_handlers/schemas.py +0 -114
  413. aiq/utils/io/__init__.py +0 -0
  414. aiq/utils/io/model_processing.py +0 -28
  415. aiq/utils/io/yaml_tools.py +0 -119
  416. aiq/utils/log_utils.py +0 -37
  417. aiq/utils/metadata_utils.py +0 -74
  418. aiq/utils/optional_imports.py +0 -142
  419. aiq/utils/producer_consumer_queue.py +0 -178
  420. aiq/utils/reactive/__init__.py +0 -0
  421. aiq/utils/reactive/base/__init__.py +0 -0
  422. aiq/utils/reactive/base/observable_base.py +0 -65
  423. aiq/utils/reactive/base/observer_base.py +0 -55
  424. aiq/utils/reactive/base/subject_base.py +0 -79
  425. aiq/utils/reactive/observable.py +0 -59
  426. aiq/utils/reactive/observer.py +0 -76
  427. aiq/utils/reactive/subject.py +0 -131
  428. aiq/utils/reactive/subscription.py +0 -49
  429. aiq/utils/settings/__init__.py +0 -0
  430. aiq/utils/settings/global_settings.py +0 -197
  431. aiq/utils/string_utils.py +0 -38
  432. aiq/utils/type_converter.py +0 -290
  433. aiq/utils/type_utils.py +0 -484
  434. aiq/utils/url_utils.py +0 -27
  435. aiqtoolkit-1.2.0rc4.dist-info/METADATA +0 -363
  436. aiqtoolkit-1.2.0rc4.dist-info/RECORD +0 -438
  437. aiqtoolkit-1.2.0rc4.dist-info/entry_points.txt +0 -20
  438. aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE-3rd-party.txt +0 -3686
  439. aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE.md +0 -201
  440. aiqtoolkit-1.2.0rc4.dist-info/top_level.txt +0 -1
  441. {aiqtoolkit-1.2.0rc4.dist-info → aiqtoolkit-1.2rc9.dist-info}/WHEEL +0 -0
aiq/eval/utils/weave_eval.py (removed)
@@ -1,184 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
-
16
- import asyncio
17
- import logging
18
- from typing import Any
19
-
20
- from aiq.eval.evaluator.evaluator_model import EvalInput
21
- from aiq.eval.evaluator.evaluator_model import EvalInputItem
22
- from aiq.eval.evaluator.evaluator_model import EvalOutput
23
- from aiq.eval.usage_stats import UsageStats
24
- from aiq.eval.usage_stats import UsageStatsItem
25
- from aiq.profiler.data_models import ProfilerResults
26
-
27
- logger = logging.getLogger(__name__)
28
-
29
-
30
- class WeaveEvaluationIntegration: # pylint: disable=too-many-public-methods
31
- """
32
- Class to handle all Weave integration functionality.
33
- """
34
-
35
- def __init__(self):
36
- self.available = False
37
- self.client = None
38
- self.eval_logger = None
39
- self.pred_loggers = {}
40
-
41
- try:
42
- from weave.flow.eval_imperative import EvaluationLogger
43
- from weave.flow.eval_imperative import ScoreLogger
44
- from weave.trace.context import weave_client_context
45
- self.EvaluationLogger = EvaluationLogger
46
- self.ScoreLogger = ScoreLogger
47
- self.weave_client_context = weave_client_context
48
- self.available = True
49
- except ImportError:
50
- self.available = False
51
- # we simply don't do anything if weave is not available
52
- pass
53
-
54
- def initialize_client(self):
55
- """Initialize the Weave client if available."""
56
- if not self.available:
57
- return False
58
-
59
- try:
60
- self.client = self.weave_client_context.require_weave_client()
61
- return self.client is not None
62
- except Exception:
63
- self.client = None
64
- return False
65
-
66
- def _get_prediction_inputs(self, item: EvalInputItem):
67
- """Get the inputs for displaying in the UI.
68
- The following fields are excluded as they are too large to display in the UI:
69
- - full_dataset_entry
70
- - expected_trajectory
71
- - trajectory
72
-
73
- output_obj is excluded because it is displayed separately.
74
- """
75
- include = {"id", "input_obj", "expected_output_obj"}
76
- return item.model_dump(include=include)
77
-
78
- def _get_weave_dataset(self, eval_input: EvalInput):
79
- """Get the full dataset for Weave."""
80
- return [item.full_dataset_entry for item in eval_input.eval_input_items]
81
-
82
- def initialize_logger(self, workflow_alias: str, eval_input: EvalInput, config: Any):
83
- """Initialize the Weave evaluation logger."""
84
- if not self.client and not self.initialize_client():
85
- # lazy init the client
86
- return False
87
-
88
- try:
89
- weave_dataset = self._get_weave_dataset(eval_input)
90
- config_dict = config.model_dump(mode="json")
91
- config_dict["name"] = workflow_alias
92
- self.eval_logger = self.EvaluationLogger(model=config_dict, dataset=weave_dataset)
93
- self.pred_loggers = {}
94
-
95
- return True
96
- except Exception as e:
97
- self.eval_logger = None
98
- logger.warning("Failed to initialize Weave `EvaluationLogger`: %s", e)
99
-
100
- return False
101
-
102
- def log_prediction(self, item: EvalInputItem, output: Any):
103
- """Log a prediction to Weave."""
104
- if not self.eval_logger:
105
- return
106
-
107
- pred_logger = self.eval_logger.log_prediction(inputs=self._get_prediction_inputs(item), output=output)
108
- self.pred_loggers[item.id] = pred_logger
109
-
110
- async def log_usage_stats(self, item: EvalInputItem, usage_stats_item: UsageStatsItem):
111
- """Log usage stats to Weave."""
112
- if not self.eval_logger:
113
- return
114
-
115
- # log each usage stat as a score
116
- await self.pred_loggers[item.id].alog_score(scorer="wf_runtime", score=usage_stats_item.runtime)
117
-
118
- # log the total tokens for this item, per-llm tokens can be exported later if needed
119
- await self.pred_loggers[item.id].alog_score(scorer="wf_tokens", score=usage_stats_item.total_tokens)
120
-
121
- async def alog_score(self, eval_output: EvalOutput, evaluator_name: str):
122
- """Log scores for evaluation outputs."""
123
- if not self.eval_logger:
124
- return
125
-
126
- # Create coroutines for all score logging operations
127
- coros = []
128
- for eval_output_item in eval_output.eval_output_items:
129
- if eval_output_item.id in self.pred_loggers:
130
- coros.append(self.pred_loggers[eval_output_item.id].alog_score(
131
- scorer=evaluator_name,
132
- score=eval_output_item.score,
133
- ))
134
-
135
- # Execute all coroutines concurrently
136
- if coros:
137
- await asyncio.gather(*coros)
138
-
139
- async def afinish_loggers(self):
140
- """Finish all prediction loggers."""
141
- if not self.eval_logger:
142
- return
143
-
144
- async def _finish_one(pred_logger):
145
- if hasattr(pred_logger, '_has_finished') and not pred_logger._has_finished:
146
- return
147
- # run the *blocking* finish() in a thread so we don't nest loops
148
- await asyncio.to_thread(pred_logger.finish)
149
-
150
- await asyncio.gather(*[_finish_one(pl) for pl in self.pred_loggers.values()])
151
-
152
- def _log_profiler_metrics(self, profiler_results: ProfilerResults, usage_stats: UsageStats) -> dict[str, Any]:
153
- """Log profiler metrics to Weave."""
154
- profile_metrics = {}
155
- if profiler_results.llm_latency_ci:
156
- profile_metrics["llm_latency_p95"] = profiler_results.llm_latency_ci.p95
157
- if profiler_results.workflow_runtime_metrics:
158
- profile_metrics["wf_runtime_p95"] = profiler_results.workflow_runtime_metrics.p95
159
-
160
- # TODO:get the LLM tokens from the usage stats and log them
161
- profile_metrics["total_runtime"] = usage_stats.total_runtime
162
-
163
- return profile_metrics
164
-
165
- def log_summary(self,
166
- usage_stats: UsageStats,
167
- evaluation_results: list[tuple[str, EvalOutput]],
168
- profiler_results: ProfilerResults):
169
- """Log summary statistics to Weave."""
170
- if not self.eval_logger:
171
- return
172
-
173
- summary = {}
174
- # add evaluation results to the summary
175
- for evaluator_name, eval_output in evaluation_results:
176
- summary[evaluator_name] = eval_output.average_score
177
-
178
- # add profiler metrics to the summary
179
- profile_metrics = self._log_profiler_metrics(profiler_results, usage_stats)
180
- summary.update(profile_metrics)
181
-
182
- # Log the summary to finish the evaluation, disable auto-summarize
183
- # as we will be adding profiler metrics to the summary
184
- self.eval_logger.log_summary(summary, auto_summarize=False)
aiq/experimental/__init__.py: File without changes
aiq/experimental/decorators/__init__.py: File without changes
@@ -1,130 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
-
16
- import functools
17
- import inspect
18
- import logging
19
- from typing import Any
20
-
21
- logger = logging.getLogger(__name__)
22
-
23
- BASE_WARNING_MESSAGE = ("is experimental and the API may change in future releases. "
24
- "Future versions may introduce breaking changes without notice.")
25
-
26
- _warning_issued = set()
27
-
28
-
29
- def issue_experimental_warning(function_name: str,
30
- feature_name: str | None = None,
31
- metadata: dict[str, Any] | None = None):
32
- """
33
- Log a warning message that the function is experimental.
34
-
35
- A warning is emitted only once per function. When a ``metadata`` dict
36
- is supplied, it is appended to the log entry to provide extra context
37
- (e.g., version, author, feature flag).
38
- """
39
- if function_name not in _warning_issued:
40
- if (feature_name):
41
- warning_message = f"The {feature_name} feature {BASE_WARNING_MESSAGE}"
42
- else:
43
- warning_message = f"This function {BASE_WARNING_MESSAGE}"
44
-
45
- warning_message += f" Function: {function_name}"
46
-
47
- if (metadata):
48
- warning_message += f" | Metadata: {metadata}"
49
-
50
- # Issue warning and save function name to avoid duplicate warnings
51
- logger.warning(warning_message)
52
-
53
- _warning_issued.add(function_name)
54
-
55
-
56
- def aiq_experimental(func: Any = None, *, feature_name: str | None = None, metadata: dict[str, Any] | None = None):
57
- """
58
- Decorator that can wrap any type of function (sync, async, generator,
59
- async generator) and logs a warning that the function is experimental.
60
-
61
- Args:
62
- func: The function to be decorated.
63
- feature_name: Optional name of the feature that is experimental. If provided, the warning will be
64
- prefixed with "The <feature_name> feature is experimental".
65
- metadata: Optional dictionary of metadata to log with the warning. This can include information
66
- like version, author, etc. If provided, the metadata will be
67
- logged alongside the experimental warning.
68
- """
69
- function_name: str = f"{func.__module__}.{func.__qualname__}" if func else "<unknown_function>"
70
-
71
- # If called as @track_function(...) but not immediately passed a function
72
- if func is None:
73
-
74
- def decorator_wrapper(actual_func):
75
- return aiq_experimental(actual_func, feature_name=feature_name, metadata=metadata)
76
-
77
- return decorator_wrapper
78
-
79
- # --- Validate metadata ---
80
- if metadata is not None:
81
- if not isinstance(metadata, dict):
82
- raise TypeError("metadata must be a dict[str, Any].")
83
- if any(not isinstance(k, str) for k in metadata.keys()):
84
- raise TypeError("All metadata keys must be strings.")
85
-
86
- # --- Now detect the function type and wrap accordingly ---
87
- if inspect.isasyncgenfunction(func):
88
- # ---------------------
89
- # ASYNC GENERATOR
90
- # ---------------------
91
-
92
- @functools.wraps(func)
93
- async def async_gen_wrapper(*args, **kwargs):
94
- issue_experimental_warning(function_name, feature_name, metadata)
95
- async for item in func(*args, **kwargs):
96
- yield item # yield the original item
97
-
98
- return async_gen_wrapper
99
-
100
- if inspect.iscoroutinefunction(func):
101
- # ---------------------
102
- # ASYNC FUNCTION
103
- # ---------------------
104
- @functools.wraps(func)
105
- async def async_wrapper(*args, **kwargs):
106
- issue_experimental_warning(function_name, feature_name, metadata)
107
- result = await func(*args, **kwargs)
108
- return result
109
-
110
- return async_wrapper
111
-
112
- if inspect.isgeneratorfunction(func):
113
- # ---------------------
114
- # SYNC GENERATOR
115
- # ---------------------
116
- @functools.wraps(func)
117
- def sync_gen_wrapper(*args, **kwargs):
118
- issue_experimental_warning(function_name, feature_name, metadata)
119
- for item in func(*args, **kwargs):
120
- yield item # yield the original item
121
-
122
- return sync_gen_wrapper
123
-
124
- @functools.wraps(func)
125
- def sync_wrapper(*args, **kwargs):
126
- issue_experimental_warning(function_name, feature_name, metadata)
127
- result = func(*args, **kwargs)
128
- return result
129
-
130
- return sync_wrapper
File without changes
@@ -1,147 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
-
16
- import asyncio
17
- import logging
18
- import re
19
-
20
- from aiq.builder.builder import Builder
21
- from aiq.builder.framework_enum import LLMFrameworkEnum
22
- from aiq.cli.register_workflow import register_its_strategy
23
- from aiq.data_models.its_strategy import ITSStrategyBaseConfig
24
- from aiq.experimental.inference_time_scaling.models.editor_config import IterativePlanRefinementConfig
25
- from aiq.experimental.inference_time_scaling.models.its_item import ITSItem
26
- from aiq.experimental.inference_time_scaling.models.stage_enums import PipelineTypeEnum
27
- from aiq.experimental.inference_time_scaling.models.stage_enums import StageTypeEnum
28
- from aiq.experimental.inference_time_scaling.models.strategy_base import StrategyBase
29
- from aiq.utils.io.model_processing import remove_r1_think_tags
30
-
31
- logger = logging.getLogger(__name__)
32
-
33
-
34
class IterativePlanRefinementEditor(StrategyBase):
    """
    An editor that takes the plan already present on each item and refines it
    multiple times using the same LLM. Each iteration updates the plan to
    (hopefully) be better.
    """

    def __init__(self, config: ITSStrategyBaseConfig) -> None:
        super().__init__(config)
        # Populated by build_components(); refine_single() rejects anything that is not a BaseChatModel.
        self.llm_bound = None

    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
        """Return the pipeline types this strategy supports (planning only)."""
        return [PipelineTypeEnum.PLANNING]

    def stage_type(self) -> StageTypeEnum:
        """Return the pipeline stage this strategy implements (editing)."""
        return StageTypeEnum.EDITING

    async def build_components(self, builder: Builder) -> None:
        """
        Build the components required for the iterative editor.

        Fetches the LLM named by ``config.editor_llm`` from the builder, wrapped for LangChain.
        """
        logger.debug("Building components for IterativePlanRefinementEditor")
        self.llm_bound = await builder.get_llm(self.config.editor_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)

    async def refine_single(self, prompt: str, context: str, its_item: ITSItem, prompt_idx: int) -> ITSItem:
        """
        Refine the plan of a single item ``config.num_iterations`` times.

        Args:
            prompt (str): The original prompt used to generate the plan.
            context (str): The agent context passed to the refinement template.
            its_item (ITSItem): The item whose ``plan`` is refined; it is updated in place.
            prompt_idx (int): Index of the item, used only in log messages.

        Returns:
            ITSItem: The same item, carrying the final plan.

        Raises:
            ValueError: If the LLM obtained in ``build_components`` is not a ``BaseChatModel``.
        """
        from langchain_core.language_models import BaseChatModel
        from langchain_core.prompts import PromptTemplate

        if not isinstance(self.llm_bound, BaseChatModel):
            raise ValueError("editor_llm must be a BaseChatModel instance for iterative plan refinement.")

        llm: BaseChatModel = self.llm_bound

        # Refinement loop
        refinement_template = PromptTemplate(
            template=self.config.refinement_template,
            input_variables=["current_plan", "context", "original_prompt"],
            validate_template=True,
        )

        current_plan = its_item.plan
        for iteration in range(1, self.config.num_iterations + 1):
            logger.info("Refinement iteration %d / %d for prompt %d", iteration, self.config.num_iterations, prompt_idx)
            refine_prompt = (await refinement_template.ainvoke({
                "current_plan": current_plan, "context": context, "original_prompt": prompt
            })).to_string()

            refine_response = await llm.ainvoke(refine_prompt)
            refined_plan = remove_r1_think_tags(
                refine_response.content if hasattr(refine_response, 'content') else str(refine_response))
            # Drop a leading "EDITED PLAN:" label (any case) from the response.
            refined_plan = re.sub(r'(?i)^\s*EDITED PLAN:\s*', '', refined_plan).strip()
            if refined_plan:
                current_plan = refined_plan
            else:
                # An empty answer must not wipe out the plan produced so far.
                logger.warning("Refinement iteration %d for prompt %d produced an empty plan; keeping existing plan.",
                               iteration,
                               prompt_idx)

        logger.info("IterativePlanRefinementEditor produced a final plan after %d iterations.",
                    self.config.num_iterations)

        its_item.plan = current_plan
        # Return a single final plan
        return its_item

    async def ainvoke(self,
                      items: list[ITSItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[ITSItem]:
        """
        Runs the iterative plan refinement process on the provided planning items.

        The items are refined concurrently, each one the configured number of
        times (``config.num_iterations``).

        Args:
            items (list[ITSItem]): The planning items to refine.
            original_prompt (str): The original prompt used to generate the plans.
            agent_context (str): The context for the agent.

        Returns:
            list[ITSItem]: The refined planning items.

        Raises:
            ValueError: If ``original_prompt`` or ``agent_context`` is missing or empty.
        """

        if not original_prompt or not agent_context:
            raise ValueError("Arguments original_prompt and agent_context must be provided.")

        # Refine each planning item concurrently; prompt indices in the logs are 1-based
        tasks = [
            self.refine_single(prompt=original_prompt, context=agent_context, its_item=item, prompt_idx=i + 1)
            for i, item in enumerate(items)
        ]

        # Run the tasks concurrently and gather results
        refined_planning_items = await asyncio.gather(*tasks)

        return refined_planning_items
130
-
131
-
132
@register_its_strategy(config_type=IterativePlanRefinementConfig)
async def register_iterative_plan_refinement_editor(config: IterativePlanRefinementConfig, builder: Builder):
    """
    Create the IterativePlanRefinementEditor strategy for ``config``.

    Args:
        config (IterativePlanRefinementConfig): The configuration for the strategy.
        builder (Builder): The builder handed to the editor's ``build_components``.

    Yields:
        IterativePlanRefinementEditor: The editor, after its components have been built.
    """
    strategy = IterativePlanRefinementEditor(config)
    await strategy.build_components(builder=builder)
    yield strategy
@@ -1,204 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
-
16
- import asyncio
17
- import logging
18
- import re
19
-
20
- from aiq.builder.builder import Builder
21
- from aiq.builder.framework_enum import LLMFrameworkEnum
22
- from aiq.cli.register_workflow import register_its_strategy
23
- from aiq.data_models.its_strategy import ITSStrategyBaseConfig
24
- from aiq.experimental.inference_time_scaling.models.editor_config import LLMAsAJudgeEditorConfig
25
- from aiq.experimental.inference_time_scaling.models.its_item import ITSItem
26
- from aiq.experimental.inference_time_scaling.models.stage_enums import PipelineTypeEnum
27
- from aiq.experimental.inference_time_scaling.models.stage_enums import StageTypeEnum
28
- from aiq.experimental.inference_time_scaling.models.strategy_base import StrategyBase
29
- from aiq.utils.io.model_processing import remove_r1_think_tags
30
-
31
- logger = logging.getLogger(__name__)
32
-
33
-
34
class LLMAsAJudgeEditor(StrategyBase):
    """
    Editing strategy that asks a feedback LLM to critique each item's plan and
    then asks an editing LLM to rewrite the plan using that feedback.
    """

    def __init__(self, config: ITSStrategyBaseConfig) -> None:
        super().__init__(config)
        # Both models are resolved later by build_components().
        self.feedback_llm = None
        self.editing_llm = None

    async def build_components(self, builder: Builder) -> None:
        """
        Resolve the feedback and editing LLMs named in the config through the builder.
        """
        langchain = LLMFrameworkEnum.LANGCHAIN
        self.feedback_llm = await builder.get_llm(self.config.feedback_llm, wrapper_type=langchain)
        self.editing_llm = await builder.get_llm(self.config.editing_llm, wrapper_type=langchain)

    def supported_pipeline_types(self) -> [PipelineTypeEnum]:
        """Return the pipeline types this strategy supports (planning only)."""
        return [PipelineTypeEnum.PLANNING]

    def stage_type(self) -> StageTypeEnum:
        """Return the pipeline stage this strategy implements (editing)."""
        return StageTypeEnum.EDITING

    async def generate_feedback(self, llm, template, context: str, prompt: str, item: ITSItem) -> ITSItem:
        """
        Ask ``llm`` for feedback on ``item.plan`` and store it on the item.

        The item is returned unchanged (with a warning logged) when the model
        gives no response or the response is empty once cleaned.
        """
        rendered = await template.ainvoke(
            input={
                "context": context,
                "original_prompt": prompt,  # the prompt the plans were generated from
                "plan": item.plan,
                "num_feedback": self.config.num_feedback
            })

        response = await llm.ainvoke(rendered.to_string())
        if not response:
            logger.warning(f"No feedback generated for plan: {item.plan}.")
            return item

        raw_text = response.content if hasattr(response, 'content') else str(response)

        # Keep only what follows a leading 'FEEDBACK:' label
        feedback_text = re.sub(r'(?i)^\s*FEEDBACK:\s*', '', remove_r1_think_tags(raw_text)).strip()
        if feedback_text:
            item.feedback = feedback_text
        else:
            logger.warning(f"Feedback was empty for plan: {item.plan}.")

        return item

    async def edit_plan(self, llm, template, context: str, prompt: str, item: ITSItem) -> ITSItem:
        """
        Ask ``llm`` to rewrite ``item.plan`` using ``item.feedback``.

        The item is returned unchanged (with a warning logged) when it carries
        no feedback, the model gives no response, or the cleaned response is empty.
        """
        if not item.feedback:
            logger.warning(f"No feedback available for plan: {item.plan}. Cannot edit.")
            return item

        rendered = await template.ainvoke(
            input={
                "context": context,
                "original_prompt": prompt,  # the prompt the plans were generated from
                "plan": item.plan,
                "feedback": item.feedback
            })

        response = await llm.ainvoke(rendered.to_string())
        if not response:
            logger.warning(f"No editing result generated for plan: {item.plan}.")
            return item

        raw_text = response.content if hasattr(response, 'content') else str(response)

        # Keep only what follows a leading 'EDITED PLAN:' label
        edited_text = re.sub(r'(?i)^\s*EDITED PLAN:\s*', '', remove_r1_think_tags(raw_text)).strip()
        if edited_text:
            item.plan = edited_text
        else:
            logger.warning(f"Edited plan was empty for plan: {item.plan}. Returning original.")

        return item

    async def ainvoke(self,
                      items: list[ITSItem],
                      original_prompt: str | None = None,
                      agent_context: str | None = None,
                      **kwargs) -> list[ITSItem]:
        """
        Run the two-pass edit over ``items``: feedback for every plan first, then the rewrites.

        Each pass processes its items concurrently. Raises ``ValueError`` when
        either LLM is not a ``BaseChatModel`` or when a pass yields no items.
        """
        from langchain_core.language_models import BaseChatModel
        from langchain_core.prompts import PromptTemplate

        # Both models must be LangChain chat models before any work starts
        if not isinstance(self.feedback_llm, BaseChatModel):
            raise ValueError("The `feedback_llm` must be an instance of `BaseChatModel`.")

        if not isinstance(self.editing_llm, BaseChatModel):
            raise ValueError("The `editing_llm` must be an instance of `BaseChatModel`.")

        critic: BaseChatModel = self.feedback_llm
        rewriter: BaseChatModel = self.editing_llm

        critique_template = PromptTemplate(template=self.config.feedback_template,
                                           input_variables=["context", "original_prompt", "plan", "num_feedback"],
                                           validate_template=True)

        rewrite_template = PromptTemplate(template=self.config.editor_template,
                                          input_variables=["context", "original_prompt", "plan", "feedback"],
                                          validate_template=True)

        # First pass: feedback for every item, run concurrently
        reviewed_items = await asyncio.gather(*(self.generate_feedback(llm=critic,
                                                                       template=critique_template,
                                                                       context=agent_context,
                                                                       prompt=original_prompt,
                                                                       item=entry) for entry in items))

        if not reviewed_items:
            raise ValueError("No feedback was generated for the planning items. Please check the LLM response.")

        logger.info("Generated feedback for %d plans.", len(reviewed_items))

        # Second pass: rewrite every item from its feedback, run concurrently
        rewritten_items = await asyncio.gather(*(self.edit_plan(llm=rewriter,
                                                                template=rewrite_template,
                                                                context=agent_context,
                                                                prompt=original_prompt,
                                                                item=entry) for entry in reviewed_items))

        if not rewritten_items:
            raise ValueError("No plans were edited. Please check the LLM response.")

        logger.info("Edited %d plans based on feedback.", len(rewritten_items))
        return rewritten_items
193
-
194
-
195
@register_its_strategy(config_type=LLMAsAJudgeEditorConfig)
async def register_llm_as_a_judge_editor(config: ITSStrategyBaseConfig, builder: Builder):
    """
    Create the LLMAsAJudgeEditor strategy for ``config``.

    The editor's components are built with ``builder`` before it is yielded.
    """
    strategy = LLMAsAJudgeEditor(config)
    await strategy.build_components(builder)
    yield strategy