aiqtoolkit 1.1.0a20250503__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of aiqtoolkit might be problematic. Click here for more details.

Files changed (314) hide show
  1. aiq/agent/__init__.py +0 -0
  2. aiq/agent/base.py +76 -0
  3. aiq/agent/dual_node.py +67 -0
  4. aiq/agent/react_agent/__init__.py +0 -0
  5. aiq/agent/react_agent/agent.py +322 -0
  6. aiq/agent/react_agent/output_parser.py +104 -0
  7. aiq/agent/react_agent/prompt.py +46 -0
  8. aiq/agent/react_agent/register.py +148 -0
  9. aiq/agent/reasoning_agent/__init__.py +0 -0
  10. aiq/agent/reasoning_agent/reasoning_agent.py +224 -0
  11. aiq/agent/register.py +23 -0
  12. aiq/agent/rewoo_agent/__init__.py +0 -0
  13. aiq/agent/rewoo_agent/agent.py +410 -0
  14. aiq/agent/rewoo_agent/prompt.py +108 -0
  15. aiq/agent/rewoo_agent/register.py +158 -0
  16. aiq/agent/tool_calling_agent/__init__.py +0 -0
  17. aiq/agent/tool_calling_agent/agent.py +123 -0
  18. aiq/agent/tool_calling_agent/register.py +105 -0
  19. aiq/builder/__init__.py +0 -0
  20. aiq/builder/builder.py +223 -0
  21. aiq/builder/component_utils.py +303 -0
  22. aiq/builder/context.py +212 -0
  23. aiq/builder/embedder.py +24 -0
  24. aiq/builder/eval_builder.py +116 -0
  25. aiq/builder/evaluator.py +29 -0
  26. aiq/builder/framework_enum.py +24 -0
  27. aiq/builder/front_end.py +73 -0
  28. aiq/builder/function.py +297 -0
  29. aiq/builder/function_base.py +376 -0
  30. aiq/builder/function_info.py +627 -0
  31. aiq/builder/intermediate_step_manager.py +127 -0
  32. aiq/builder/llm.py +25 -0
  33. aiq/builder/retriever.py +25 -0
  34. aiq/builder/user_interaction_manager.py +71 -0
  35. aiq/builder/workflow.py +143 -0
  36. aiq/builder/workflow_builder.py +749 -0
  37. aiq/cli/__init__.py +14 -0
  38. aiq/cli/cli_utils/__init__.py +0 -0
  39. aiq/cli/cli_utils/config_override.py +233 -0
  40. aiq/cli/cli_utils/validation.py +37 -0
  41. aiq/cli/commands/__init__.py +0 -0
  42. aiq/cli/commands/configure/__init__.py +0 -0
  43. aiq/cli/commands/configure/channel/__init__.py +0 -0
  44. aiq/cli/commands/configure/channel/add.py +28 -0
  45. aiq/cli/commands/configure/channel/channel.py +36 -0
  46. aiq/cli/commands/configure/channel/remove.py +30 -0
  47. aiq/cli/commands/configure/channel/update.py +30 -0
  48. aiq/cli/commands/configure/configure.py +33 -0
  49. aiq/cli/commands/evaluate.py +139 -0
  50. aiq/cli/commands/info/__init__.py +14 -0
  51. aiq/cli/commands/info/info.py +37 -0
  52. aiq/cli/commands/info/list_channels.py +32 -0
  53. aiq/cli/commands/info/list_components.py +129 -0
  54. aiq/cli/commands/registry/__init__.py +14 -0
  55. aiq/cli/commands/registry/publish.py +88 -0
  56. aiq/cli/commands/registry/pull.py +118 -0
  57. aiq/cli/commands/registry/registry.py +38 -0
  58. aiq/cli/commands/registry/remove.py +108 -0
  59. aiq/cli/commands/registry/search.py +155 -0
  60. aiq/cli/commands/start.py +250 -0
  61. aiq/cli/commands/uninstall.py +83 -0
  62. aiq/cli/commands/validate.py +47 -0
  63. aiq/cli/commands/workflow/__init__.py +14 -0
  64. aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
  65. aiq/cli/commands/workflow/templates/config.yml.j2 +16 -0
  66. aiq/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
  67. aiq/cli/commands/workflow/templates/register.py.j2 +5 -0
  68. aiq/cli/commands/workflow/templates/workflow.py.j2 +36 -0
  69. aiq/cli/commands/workflow/workflow.py +37 -0
  70. aiq/cli/commands/workflow/workflow_commands.py +313 -0
  71. aiq/cli/entrypoint.py +133 -0
  72. aiq/cli/main.py +44 -0
  73. aiq/cli/register_workflow.py +408 -0
  74. aiq/cli/type_registry.py +879 -0
  75. aiq/data_models/__init__.py +14 -0
  76. aiq/data_models/api_server.py +588 -0
  77. aiq/data_models/common.py +143 -0
  78. aiq/data_models/component.py +46 -0
  79. aiq/data_models/component_ref.py +135 -0
  80. aiq/data_models/config.py +349 -0
  81. aiq/data_models/dataset_handler.py +122 -0
  82. aiq/data_models/discovery_metadata.py +269 -0
  83. aiq/data_models/embedder.py +26 -0
  84. aiq/data_models/evaluate.py +104 -0
  85. aiq/data_models/evaluator.py +26 -0
  86. aiq/data_models/front_end.py +26 -0
  87. aiq/data_models/function.py +30 -0
  88. aiq/data_models/function_dependencies.py +64 -0
  89. aiq/data_models/interactive.py +237 -0
  90. aiq/data_models/intermediate_step.py +269 -0
  91. aiq/data_models/invocation_node.py +38 -0
  92. aiq/data_models/llm.py +26 -0
  93. aiq/data_models/logging.py +26 -0
  94. aiq/data_models/memory.py +26 -0
  95. aiq/data_models/profiler.py +53 -0
  96. aiq/data_models/registry_handler.py +26 -0
  97. aiq/data_models/retriever.py +30 -0
  98. aiq/data_models/step_adaptor.py +64 -0
  99. aiq/data_models/streaming.py +33 -0
  100. aiq/data_models/swe_bench_model.py +54 -0
  101. aiq/data_models/telemetry_exporter.py +26 -0
  102. aiq/embedder/__init__.py +0 -0
  103. aiq/embedder/langchain_client.py +41 -0
  104. aiq/embedder/nim_embedder.py +58 -0
  105. aiq/embedder/openai_embedder.py +42 -0
  106. aiq/embedder/register.py +24 -0
  107. aiq/eval/__init__.py +14 -0
  108. aiq/eval/config.py +42 -0
  109. aiq/eval/dataset_handler/__init__.py +0 -0
  110. aiq/eval/dataset_handler/dataset_downloader.py +106 -0
  111. aiq/eval/dataset_handler/dataset_filter.py +52 -0
  112. aiq/eval/dataset_handler/dataset_handler.py +169 -0
  113. aiq/eval/evaluate.py +323 -0
  114. aiq/eval/evaluator/__init__.py +14 -0
  115. aiq/eval/evaluator/evaluator_model.py +44 -0
  116. aiq/eval/intermediate_step_adapter.py +93 -0
  117. aiq/eval/rag_evaluator/__init__.py +0 -0
  118. aiq/eval/rag_evaluator/evaluate.py +138 -0
  119. aiq/eval/rag_evaluator/register.py +138 -0
  120. aiq/eval/register.py +23 -0
  121. aiq/eval/remote_workflow.py +128 -0
  122. aiq/eval/runtime_event_subscriber.py +52 -0
  123. aiq/eval/swe_bench_evaluator/__init__.py +0 -0
  124. aiq/eval/swe_bench_evaluator/evaluate.py +215 -0
  125. aiq/eval/swe_bench_evaluator/register.py +36 -0
  126. aiq/eval/trajectory_evaluator/__init__.py +0 -0
  127. aiq/eval/trajectory_evaluator/evaluate.py +118 -0
  128. aiq/eval/trajectory_evaluator/register.py +40 -0
  129. aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
  130. aiq/eval/tunable_rag_evaluator/evaluate.py +263 -0
  131. aiq/eval/tunable_rag_evaluator/register.py +50 -0
  132. aiq/eval/utils/__init__.py +0 -0
  133. aiq/eval/utils/output_uploader.py +131 -0
  134. aiq/eval/utils/tqdm_position_registry.py +40 -0
  135. aiq/front_ends/__init__.py +14 -0
  136. aiq/front_ends/console/__init__.py +14 -0
  137. aiq/front_ends/console/console_front_end_config.py +32 -0
  138. aiq/front_ends/console/console_front_end_plugin.py +107 -0
  139. aiq/front_ends/console/register.py +25 -0
  140. aiq/front_ends/cron/__init__.py +14 -0
  141. aiq/front_ends/fastapi/__init__.py +14 -0
  142. aiq/front_ends/fastapi/fastapi_front_end_config.py +150 -0
  143. aiq/front_ends/fastapi/fastapi_front_end_plugin.py +103 -0
  144. aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +607 -0
  145. aiq/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
  146. aiq/front_ends/fastapi/job_store.py +161 -0
  147. aiq/front_ends/fastapi/main.py +70 -0
  148. aiq/front_ends/fastapi/message_handler.py +279 -0
  149. aiq/front_ends/fastapi/message_validator.py +345 -0
  150. aiq/front_ends/fastapi/register.py +25 -0
  151. aiq/front_ends/fastapi/response_helpers.py +195 -0
  152. aiq/front_ends/fastapi/step_adaptor.py +315 -0
  153. aiq/front_ends/fastapi/websocket.py +148 -0
  154. aiq/front_ends/mcp/__init__.py +14 -0
  155. aiq/front_ends/mcp/mcp_front_end_config.py +32 -0
  156. aiq/front_ends/mcp/mcp_front_end_plugin.py +93 -0
  157. aiq/front_ends/mcp/register.py +27 -0
  158. aiq/front_ends/mcp/tool_converter.py +242 -0
  159. aiq/front_ends/register.py +22 -0
  160. aiq/front_ends/simple_base/__init__.py +14 -0
  161. aiq/front_ends/simple_base/simple_front_end_plugin_base.py +52 -0
  162. aiq/llm/__init__.py +0 -0
  163. aiq/llm/nim_llm.py +45 -0
  164. aiq/llm/openai_llm.py +45 -0
  165. aiq/llm/register.py +22 -0
  166. aiq/llm/utils/__init__.py +14 -0
  167. aiq/llm/utils/env_config_value.py +94 -0
  168. aiq/llm/utils/error.py +17 -0
  169. aiq/memory/__init__.py +20 -0
  170. aiq/memory/interfaces.py +183 -0
  171. aiq/memory/models.py +102 -0
  172. aiq/meta/module_to_distro.json +3 -0
  173. aiq/meta/pypi.md +59 -0
  174. aiq/observability/__init__.py +0 -0
  175. aiq/observability/async_otel_listener.py +433 -0
  176. aiq/observability/register.py +99 -0
  177. aiq/plugins/.namespace +1 -0
  178. aiq/profiler/__init__.py +0 -0
  179. aiq/profiler/callbacks/__init__.py +0 -0
  180. aiq/profiler/callbacks/agno_callback_handler.py +295 -0
  181. aiq/profiler/callbacks/base_callback_class.py +20 -0
  182. aiq/profiler/callbacks/langchain_callback_handler.py +278 -0
  183. aiq/profiler/callbacks/llama_index_callback_handler.py +205 -0
  184. aiq/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
  185. aiq/profiler/callbacks/token_usage_base_model.py +27 -0
  186. aiq/profiler/data_frame_row.py +51 -0
  187. aiq/profiler/decorators/__init__.py +0 -0
  188. aiq/profiler/decorators/framework_wrapper.py +131 -0
  189. aiq/profiler/decorators/function_tracking.py +254 -0
  190. aiq/profiler/forecasting/__init__.py +0 -0
  191. aiq/profiler/forecasting/config.py +18 -0
  192. aiq/profiler/forecasting/model_trainer.py +75 -0
  193. aiq/profiler/forecasting/models/__init__.py +22 -0
  194. aiq/profiler/forecasting/models/forecasting_base_model.py +40 -0
  195. aiq/profiler/forecasting/models/linear_model.py +196 -0
  196. aiq/profiler/forecasting/models/random_forest_regressor.py +268 -0
  197. aiq/profiler/inference_metrics_model.py +25 -0
  198. aiq/profiler/inference_optimization/__init__.py +0 -0
  199. aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
  200. aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +452 -0
  201. aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
  202. aiq/profiler/inference_optimization/data_models.py +386 -0
  203. aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
  204. aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
  205. aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
  206. aiq/profiler/inference_optimization/llm_metrics.py +212 -0
  207. aiq/profiler/inference_optimization/prompt_caching.py +163 -0
  208. aiq/profiler/inference_optimization/token_uniqueness.py +107 -0
  209. aiq/profiler/inference_optimization/workflow_runtimes.py +72 -0
  210. aiq/profiler/intermediate_property_adapter.py +102 -0
  211. aiq/profiler/profile_runner.py +433 -0
  212. aiq/profiler/utils.py +184 -0
  213. aiq/registry_handlers/__init__.py +0 -0
  214. aiq/registry_handlers/local/__init__.py +0 -0
  215. aiq/registry_handlers/local/local_handler.py +176 -0
  216. aiq/registry_handlers/local/register_local.py +37 -0
  217. aiq/registry_handlers/metadata_factory.py +60 -0
  218. aiq/registry_handlers/package_utils.py +198 -0
  219. aiq/registry_handlers/pypi/__init__.py +0 -0
  220. aiq/registry_handlers/pypi/pypi_handler.py +251 -0
  221. aiq/registry_handlers/pypi/register_pypi.py +40 -0
  222. aiq/registry_handlers/register.py +21 -0
  223. aiq/registry_handlers/registry_handler_base.py +157 -0
  224. aiq/registry_handlers/rest/__init__.py +0 -0
  225. aiq/registry_handlers/rest/register_rest.py +56 -0
  226. aiq/registry_handlers/rest/rest_handler.py +237 -0
  227. aiq/registry_handlers/schemas/__init__.py +0 -0
  228. aiq/registry_handlers/schemas/headers.py +42 -0
  229. aiq/registry_handlers/schemas/package.py +68 -0
  230. aiq/registry_handlers/schemas/publish.py +63 -0
  231. aiq/registry_handlers/schemas/pull.py +82 -0
  232. aiq/registry_handlers/schemas/remove.py +36 -0
  233. aiq/registry_handlers/schemas/search.py +91 -0
  234. aiq/registry_handlers/schemas/status.py +47 -0
  235. aiq/retriever/__init__.py +0 -0
  236. aiq/retriever/interface.py +37 -0
  237. aiq/retriever/milvus/__init__.py +14 -0
  238. aiq/retriever/milvus/register.py +81 -0
  239. aiq/retriever/milvus/retriever.py +228 -0
  240. aiq/retriever/models.py +74 -0
  241. aiq/retriever/nemo_retriever/__init__.py +14 -0
  242. aiq/retriever/nemo_retriever/register.py +60 -0
  243. aiq/retriever/nemo_retriever/retriever.py +190 -0
  244. aiq/retriever/register.py +22 -0
  245. aiq/runtime/__init__.py +14 -0
  246. aiq/runtime/loader.py +188 -0
  247. aiq/runtime/runner.py +176 -0
  248. aiq/runtime/session.py +136 -0
  249. aiq/runtime/user_metadata.py +131 -0
  250. aiq/settings/__init__.py +0 -0
  251. aiq/settings/global_settings.py +318 -0
  252. aiq/test/.namespace +1 -0
  253. aiq/tool/__init__.py +0 -0
  254. aiq/tool/code_execution/__init__.py +0 -0
  255. aiq/tool/code_execution/code_sandbox.py +188 -0
  256. aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
  257. aiq/tool/code_execution/local_sandbox/__init__.py +13 -0
  258. aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +79 -0
  259. aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +4 -0
  260. aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +25 -0
  261. aiq/tool/code_execution/register.py +70 -0
  262. aiq/tool/code_execution/utils.py +100 -0
  263. aiq/tool/datetime_tools.py +42 -0
  264. aiq/tool/document_search.py +141 -0
  265. aiq/tool/github_tools/__init__.py +0 -0
  266. aiq/tool/github_tools/create_github_commit.py +133 -0
  267. aiq/tool/github_tools/create_github_issue.py +87 -0
  268. aiq/tool/github_tools/create_github_pr.py +106 -0
  269. aiq/tool/github_tools/get_github_file.py +106 -0
  270. aiq/tool/github_tools/get_github_issue.py +166 -0
  271. aiq/tool/github_tools/get_github_pr.py +256 -0
  272. aiq/tool/github_tools/update_github_issue.py +100 -0
  273. aiq/tool/mcp/__init__.py +14 -0
  274. aiq/tool/mcp/mcp_client.py +220 -0
  275. aiq/tool/mcp/mcp_tool.py +76 -0
  276. aiq/tool/memory_tools/__init__.py +0 -0
  277. aiq/tool/memory_tools/add_memory_tool.py +67 -0
  278. aiq/tool/memory_tools/delete_memory_tool.py +67 -0
  279. aiq/tool/memory_tools/get_memory_tool.py +72 -0
  280. aiq/tool/nvidia_rag.py +95 -0
  281. aiq/tool/register.py +36 -0
  282. aiq/tool/retriever.py +89 -0
  283. aiq/utils/__init__.py +0 -0
  284. aiq/utils/data_models/__init__.py +0 -0
  285. aiq/utils/data_models/schema_validator.py +58 -0
  286. aiq/utils/debugging_utils.py +43 -0
  287. aiq/utils/exception_handlers/__init__.py +0 -0
  288. aiq/utils/exception_handlers/schemas.py +114 -0
  289. aiq/utils/io/__init__.py +0 -0
  290. aiq/utils/io/yaml_tools.py +119 -0
  291. aiq/utils/metadata_utils.py +74 -0
  292. aiq/utils/optional_imports.py +142 -0
  293. aiq/utils/producer_consumer_queue.py +178 -0
  294. aiq/utils/reactive/__init__.py +0 -0
  295. aiq/utils/reactive/base/__init__.py +0 -0
  296. aiq/utils/reactive/base/observable_base.py +65 -0
  297. aiq/utils/reactive/base/observer_base.py +55 -0
  298. aiq/utils/reactive/base/subject_base.py +79 -0
  299. aiq/utils/reactive/observable.py +59 -0
  300. aiq/utils/reactive/observer.py +76 -0
  301. aiq/utils/reactive/subject.py +131 -0
  302. aiq/utils/reactive/subscription.py +49 -0
  303. aiq/utils/settings/__init__.py +0 -0
  304. aiq/utils/settings/global_settings.py +197 -0
  305. aiq/utils/type_converter.py +232 -0
  306. aiq/utils/type_utils.py +397 -0
  307. aiq/utils/url_utils.py +27 -0
  308. aiqtoolkit-1.1.0a20250503.dist-info/METADATA +330 -0
  309. aiqtoolkit-1.1.0a20250503.dist-info/RECORD +314 -0
  310. aiqtoolkit-1.1.0a20250503.dist-info/WHEEL +5 -0
  311. aiqtoolkit-1.1.0a20250503.dist-info/entry_points.txt +17 -0
  312. aiqtoolkit-1.1.0a20250503.dist-info/licenses/LICENSE-3rd-party.txt +3686 -0
  313. aiqtoolkit-1.1.0a20250503.dist-info/licenses/LICENSE.md +201 -0
  314. aiqtoolkit-1.1.0a20250503.dist-info/top_level.txt +1 -0
@@ -0,0 +1,315 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import html
17
+ import logging
18
+ from functools import reduce
19
+ from textwrap import dedent
20
+
21
+ from aiq.data_models.api_server import AIQResponseIntermediateStep
22
+ from aiq.data_models.api_server import AIQResponseSerializable
23
+ from aiq.data_models.intermediate_step import IntermediateStep
24
+ from aiq.data_models.intermediate_step import IntermediateStepCategory
25
+ from aiq.data_models.intermediate_step import IntermediateStepPayload
26
+ from aiq.data_models.intermediate_step import IntermediateStepType
27
+ from aiq.data_models.invocation_node import InvocationNode
28
+ from aiq.data_models.step_adaptor import StepAdaptorConfig
29
+ from aiq.data_models.step_adaptor import StepAdaptorMode
30
+ from aiq.utils.type_utils import is_valid_json
31
+
32
+ logger = logging.getLogger(__name__)
33
+
34
+
35
+ class StepAdaptor:
36
+
37
+ def __init__(self, config: StepAdaptorConfig):
38
+
39
+ self._history: list[IntermediateStep] = []
40
+ self.config = config
41
+
42
+ def _step_matches_filter(self, step: IntermediateStep, config: StepAdaptorConfig) -> bool:
43
+ """
44
+ Returns True if this intermediate step should be included (based on the config.mode).
45
+ """
46
+
47
+ if config.mode == StepAdaptorMode.OFF:
48
+ return False
49
+
50
+ if config.mode == StepAdaptorMode.DEFAULT:
51
+ # default existing behavior: show LLM events + TOOL_END + FUNCTION events
52
+ if step.event_category == IntermediateStepCategory.LLM:
53
+ return True
54
+ if step.event_type == IntermediateStepType.TOOL_END:
55
+ return True
56
+ if step.event_type in [IntermediateStepType.FUNCTION_START, IntermediateStepType.FUNCTION_END]:
57
+ return True
58
+ return False
59
+
60
+ if config.mode == StepAdaptorMode.CUSTOM:
61
+ # pass only what the user explicitly listed
62
+ return step.event_type in config.custom_event_types
63
+
64
+ return False
65
+
66
+ def _handle_llm(self, step: IntermediateStepPayload, ancestry: InvocationNode) -> AIQResponseSerializable | None:
67
+ input_str: str | None = None
68
+ output_str: str | None = None
69
+
70
+ # Find the start in the history with matching run_id
71
+ start_step = next(
72
+ (x for x in self._history if x.event_type == IntermediateStepType.LLM_START and x.UUID == step.UUID), None)
73
+
74
+ if not start_step:
75
+ # If we don't have a start step, we can't do anything
76
+ return None
77
+
78
+ input_str = str(start_step.data.input)
79
+
80
+ if step.event_type == IntermediateStepType.LLM_NEW_TOKEN:
81
+
82
+ # Find all of the previous LLM chunks and concatenate them
83
+ output_str = reduce(
84
+ lambda x, y: x + y,
85
+ (str(x.data.chunk)
86
+ for x in self._history if x.event_type == IntermediateStepType.LLM_NEW_TOKEN and x.UUID == step.UUID),
87
+ "")
88
+
89
+ elif step.event_type == IntermediateStepType.LLM_END:
90
+ output_str = str(step.data.output)
91
+
92
+ if not input_str and not output_str:
93
+ return None
94
+
95
+ escaped_input = html.escape(input_str, quote=False)
96
+
97
+ # Dont use f-strings here because the payload is markdown and screws up the dedent
98
+ payload = dedent("""
99
+ **Input:**
100
+ ```python
101
+ {input_value}
102
+ ```
103
+ """).strip("\n").format(input_value=escaped_input)
104
+
105
+ if (output_str):
106
+ escaped_output = html.escape(output_str, quote=False) if output_str else ""
107
+
108
+ # Dont use f-strings here because the payload is markdown and screws up the dedent
109
+ payload = dedent("""
110
+ {payload}
111
+
112
+ **Output:**
113
+ {output_value}
114
+ """).strip("\n").format(payload=payload, output_value=escaped_output)
115
+
116
+ event = AIQResponseIntermediateStep(id=step.UUID,
117
+ name=step.name or "",
118
+ payload=payload,
119
+ parent_id=ancestry.function_id)
120
+
121
+ return event
122
+
123
+ def _handle_tool_end(self, payload: IntermediateStepPayload,
124
+ ancestry: InvocationNode) -> AIQResponseSerializable | None:
125
+ """
126
+ Handles the TOOL_END event
127
+ """
128
+ escaped_tool_input = html.escape(str(payload.data.input), quote=False)
129
+ escaped_tool_output = html.escape(str(payload.data.output), quote=False)
130
+
131
+ escaped_tool_input = escaped_tool_input.replace("\n", "")
132
+ escaped_tool_output = escaped_tool_output.replace("\n", "")
133
+
134
+ # Determine the format
135
+ format_input_type = "json" if is_valid_json(escaped_tool_input) else "python"
136
+ format_output_type = "json" if is_valid_json(escaped_tool_output) else "python"
137
+
138
+ # Dont use f-strings here because the payload is markdown and screws up the dedent
139
+ payload_str = dedent("""
140
+ **Input:**
141
+ ```{format_input_type}
142
+ {input_value}
143
+ ```
144
+ **Output:**
145
+ ```{format_output_type}
146
+ {output_value}
147
+ ```
148
+ """).strip("\n").format(input_value=escaped_tool_input,
149
+ output_value=escaped_tool_output,
150
+ format_input_type=format_input_type,
151
+ format_output_type=format_output_type)
152
+
153
+ event = AIQResponseIntermediateStep(id=payload.UUID,
154
+ name=f"Tool: {payload.name}",
155
+ payload=payload_str,
156
+ parent_id=ancestry.function_id)
157
+
158
+ return event
159
+
160
+ def _handle_function(self, step: IntermediateStepPayload,
161
+ ancestry: InvocationNode) -> AIQResponseSerializable | None:
162
+ """
163
+ Handles the FUNCTION_START and FUNCTION_END events
164
+ """
165
+ input_str: str | None = None
166
+ output_str: str | None = None
167
+
168
+ if step.event_type == IntermediateStepType.FUNCTION_START:
169
+ # For function start events, display input data
170
+ if step.data and hasattr(step.data, 'input'):
171
+ input_str = str(step.data.input)
172
+ elif step.data:
173
+ input_str = str(step.data)
174
+
175
+ if not input_str:
176
+ return None
177
+
178
+ escaped_input = html.escape(input_str, quote=False)
179
+ format_input_type = "json" if is_valid_json(escaped_input) else "python"
180
+
181
+ # Create payload for function start
182
+ payload_str = dedent("""
183
+ **Function Input:**
184
+ ```{format_input_type}
185
+ {input_value}
186
+ ```
187
+ """).strip("\n").format(input_value=escaped_input, format_input_type=format_input_type)
188
+
189
+ event = AIQResponseIntermediateStep(id=step.UUID,
190
+ name=f"Function Start: {step.name}",
191
+ payload=payload_str,
192
+ parent_id=ancestry.parent_id)
193
+ return event
194
+
195
+ if step.event_type == IntermediateStepType.FUNCTION_END:
196
+ # Find the start event with matching UUID
197
+ start_step = next(
198
+ (x
199
+ for x in self._history if x.event_type == IntermediateStepType.FUNCTION_START and x.UUID == step.UUID),
200
+ None)
201
+
202
+ # For function end events, display output data
203
+ if step.data and hasattr(step.data, 'output'):
204
+ output_str = str(step.data.output)
205
+ elif step.data:
206
+ output_str = str(step.data)
207
+
208
+ if not output_str:
209
+ return None
210
+
211
+ escaped_output = html.escape(output_str, quote=False)
212
+ format_output_type = "json" if is_valid_json(escaped_output) else "python"
213
+
214
+ # Get input from start step if available
215
+ input_payload = ""
216
+ if start_step and start_step.data:
217
+ if hasattr(start_step.data, 'input'):
218
+ input_str = str(start_step.data.input)
219
+ else:
220
+ input_str = str(start_step.data)
221
+
222
+ if input_str:
223
+ escaped_input = html.escape(input_str, quote=False)
224
+ format_input_type = "json" if is_valid_json(escaped_input) else "python"
225
+ input_payload = dedent("""
226
+ **Function Input:**
227
+ ```{format_input_type}
228
+ {input_value}
229
+ ```
230
+ """).strip("\n").format(input_value=escaped_input, format_input_type=format_input_type)
231
+
232
+ # Create payload for function end
233
+ payload_str = dedent("""
234
+ {input_payload}**Function Output:**
235
+ ```{format_output_type}
236
+ {output_value}
237
+ ```
238
+ """).strip("\n").format(input_payload=input_payload,
239
+ output_value=escaped_output,
240
+ format_output_type=format_output_type)
241
+
242
+ event = AIQResponseIntermediateStep(id=step.UUID,
243
+ name=f"Function Complete: {step.name}",
244
+ payload=payload_str,
245
+ parent_id=ancestry.parent_id)
246
+ return event
247
+
248
+ return None
249
+
250
+ def _handle_custom(self, payload: IntermediateStepPayload,
251
+ ancestry: InvocationNode) -> AIQResponseSerializable | None:
252
+ """
253
+ Handles the CUSTOM event
254
+ """
255
+ escaped_payload = html.escape(str(payload), quote=False)
256
+ escaped_payload = escaped_payload.replace("\n", "")
257
+
258
+ # Attempt to determine type
259
+ format_type = "json" if is_valid_json(escaped_payload) else "python"
260
+
261
+ # Don't use f-strings here because the payload is markdown and screws up the dedent
262
+ payload_str = dedent("""
263
+ ```{format_type}
264
+ {payload}
265
+ ```
266
+ """).strip("\n").format(payload=escaped_payload, format_type=format_type)
267
+
268
+ # Return the event
269
+ event = AIQResponseIntermediateStep(id=payload.UUID,
270
+ name=f"{payload.event_type}",
271
+ payload=payload_str,
272
+ parent_id=ancestry.function_id)
273
+
274
+ return event
275
+
276
+ def process(self, step: IntermediateStep) -> AIQResponseSerializable | None:
277
+ # Track the chunk
278
+ self._history.append(step)
279
+ payload = step.payload
280
+ ancestry = step.function_ancestry
281
+
282
+ if not self._step_matches_filter(step, self.config):
283
+ return None
284
+
285
+ try:
286
+
287
+ if self.config.mode == StepAdaptorMode.DEFAULT:
288
+
289
+ if step.event_category == IntermediateStepCategory.LLM:
290
+ return self._handle_llm(payload, ancestry)
291
+
292
+ if step.event_type == IntermediateStepType.TOOL_END:
293
+ return self._handle_tool_end(payload, ancestry)
294
+
295
+ if step.event_type in [IntermediateStepType.FUNCTION_START, IntermediateStepType.FUNCTION_END]:
296
+ return self._handle_function(payload, ancestry)
297
+
298
+ if self.config.mode == StepAdaptorMode.CUSTOM:
299
+ # Now we're processing user defined custom types
300
+
301
+ if step.event_category == IntermediateStepCategory.LLM:
302
+ return self._handle_llm(payload, ancestry)
303
+
304
+ if step.event_type == IntermediateStepType.TOOL_END:
305
+ return self._handle_tool_end(payload, ancestry)
306
+
307
+ if step.event_type in [IntermediateStepType.FUNCTION_START, IntermediateStepType.FUNCTION_END]:
308
+ return self._handle_function(payload, ancestry)
309
+
310
+ return self._handle_custom(payload, ancestry)
311
+
312
+ except Exception as e:
313
+ logger.error("Error processing intermediate step: %s", e, exc_info=True)
314
+
315
+ return None
@@ -0,0 +1,148 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import asyncio
17
+ import logging
18
+ import typing
19
+ from collections.abc import Awaitable
20
+ from collections.abc import Callable
21
+ from typing import Any
22
+
23
+ from fastapi import WebSocket
24
+ from fastapi import WebSocketException
25
+ from starlette.endpoints import WebSocketEndpoint
26
+ from starlette.websockets import WebSocketDisconnect
27
+
28
+ from aiq.data_models.api_server import AIQChatRequest
29
+ from aiq.data_models.api_server import AIQChatResponse
30
+ from aiq.data_models.api_server import AIQChatResponseChunk
31
+ from aiq.data_models.api_server import AIQResponsePayloadOutput
32
+ from aiq.data_models.api_server import AIQResponseSerializable
33
+ from aiq.data_models.api_server import WebSocketMessageStatus
34
+ from aiq.data_models.api_server import WorkflowSchemaType
35
+ from aiq.front_ends.fastapi.message_handler import MessageHandler
36
+ from aiq.front_ends.fastapi.response_helpers import generate_streaming_response
37
+ from aiq.front_ends.fastapi.step_adaptor import StepAdaptor
38
+ from aiq.runtime.session import AIQSessionManager
39
+
40
+ logger = logging.getLogger(__name__)
41
+
42
+
43
+ class AIQWebSocket(WebSocketEndpoint):
44
+ encoding = "json"
45
+
46
+ def __init__(self, session_manager: AIQSessionManager, step_adaptor: StepAdaptor, *args, **kwargs):
47
+ self._session_manager: AIQSessionManager = session_manager
48
+ self._message_handler: MessageHandler = MessageHandler(self)
49
+ self._process_response_event: asyncio.Event = asyncio.Event()
50
+ self._workflow_schema_type: dict[str, Callable[..., Awaitable[Any]]] = {
51
+ WorkflowSchemaType.GENERATE_STREAM: self.process_generate_stream,
52
+ WorkflowSchemaType.CHAT_STREAM: self.process_chat_stream,
53
+ WorkflowSchemaType.GENERATE: self.process_generate,
54
+ WorkflowSchemaType.CHAT: self.process_chat
55
+ }
56
+ self._step_adaptor = step_adaptor
57
+ super().__init__(*args, **kwargs)
58
+
59
+ @property
60
+ def workflow_schema_type(self) -> dict[str, Callable[..., Awaitable[Any]]]:
61
+ return self._workflow_schema_type
62
+
63
+ @property
64
+ def process_response_event(self) -> asyncio.Event:
65
+ return self._process_response_event
66
+
67
+ async def on_connect(self, websocket: WebSocket):
68
+ try:
69
+ # Accept the websocket connection
70
+ await websocket.accept()
71
+ try:
72
+ # Start background message processors
73
+ self._message_handler.process_messages_task = asyncio.create_task(
74
+ self._message_handler.process_messages())
75
+
76
+ self._message_handler.process_out_going_messages_task = asyncio.create_task(
77
+ self._message_handler.process_out_going_messages(websocket))
78
+
79
+ except asyncio.CancelledError:
80
+ pass
81
+
82
+ except (WebSocketDisconnect, WebSocketException):
83
+ logger.error("A WebSocket error occured during `on_connect`. Ignoring the connection.", exc_info=True)
84
+
85
+ async def on_send(self, websocket: WebSocket, data: dict[str, str]):
86
+ try:
87
+ await websocket.send_json(data)
88
+ except (WebSocketDisconnect, WebSocketException, Exception):
89
+ logger.error("A WebSocket error occurred during `on_send`. Ignoring the connection.", exc_info=True)
90
+
91
+ async def on_receive(self, websocket: WebSocket, data: dict[str, Any]):
92
+ try:
93
+ await self._message_handler.messages_queue.put(data)
94
+ except (Exception):
95
+ logger.error("An unxpected error occurred during `on_receive`. Ignoring the exception", exc_info=True)
96
+
97
+ async def on_disconnect(self, websocket: WebSocket, close_code: Any):
98
+ try:
99
+ if self._message_handler.process_messages_task:
100
+ self._message_handler.process_messages_task.cancel()
101
+
102
+ if self._message_handler.process_out_going_messages_task:
103
+ self._message_handler.process_out_going_messages_task.cancel()
104
+
105
+ if self._message_handler.background_task:
106
+ self._message_handler.background_task.cancel()
107
+
108
+ except (WebSocketDisconnect, asyncio.CancelledError):
109
+ pass
110
+
111
+ async def _process_message(self,
112
+ payload: typing.Any,
113
+ result_type: type | None = None,
114
+ output_type: type | None = None) -> None:
115
+
116
+ async with self._session_manager.session(
117
+ user_input_callback=self._message_handler.human_interaction) as session:
118
+
119
+ async for value in generate_streaming_response(payload,
120
+ session_manager=session,
121
+ streaming=True,
122
+ step_adaptor=self._step_adaptor,
123
+ result_type=result_type,
124
+ output_type=output_type):
125
+
126
+ await self._process_response_event.wait()
127
+
128
+ if not isinstance(value, AIQResponseSerializable):
129
+ value = AIQResponsePayloadOutput(payload=value)
130
+
131
+ await self._message_handler.create_websocket_message(data_model=value,
132
+ status=WebSocketMessageStatus.IN_PROGRESS)
133
+
134
+ async def process_generate_stream(self, payload: str):
135
+
136
+ return await self._process_message(payload, result_type=None, output_type=None)
137
+
138
+ async def process_chat_stream(self, payload: AIQChatRequest):
139
+
140
+ return await self._process_message(payload, result_type=AIQChatResponse, output_type=AIQChatResponseChunk)
141
+
142
+ async def process_generate(self, payload: typing.Any):
143
+
144
+ return await self._process_message(payload)
145
+
146
+ async def process_chat(self, payload: AIQChatRequest):
147
+
148
+ return await self._process_message(payload, result_type=AIQChatResponse)
@@ -0,0 +1,14 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
@@ -0,0 +1,32 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from pydantic import Field
17
+
18
+ from aiq.data_models.front_end import FrontEndBaseConfig
19
+
20
+
21
+ class MCPFrontEndConfig(FrontEndBaseConfig, name="mcp"):
22
+ """MCP front end configuration.
23
+
24
+ A simple MCP (Modular Communication Protocol) front end for AIQ.
25
+ """
26
+
27
+ name: str = Field(default="AIQ MCP", description="Name of the MCP server")
28
+ host: str = Field(default="localhost", description="Host to bind the server to")
29
+ port: int = Field(default=9901, description="Port to bind the server to", ge=0, le=65535)
30
+ debug: bool = Field(default=False, description="Enable debug mode")
31
+ log_level: str = Field(default="INFO", description="Log level for the MCP server")
32
+ tool_names: list[str] = Field(default_factory=list, description="The list of tools MCP server will expose.")
@@ -0,0 +1,93 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import logging
17
+
18
+ from aiq.builder.front_end import FrontEndBase
19
+ from aiq.builder.function import Function
20
+ from aiq.builder.workflow import Workflow
21
+ from aiq.builder.workflow_builder import WorkflowBuilder
22
+ from aiq.front_ends.mcp.mcp_front_end_config import MCPFrontEndConfig
23
+
24
+ logger = logging.getLogger(__name__)
25
+
26
+
27
+ class MCPFrontEndPlugin(FrontEndBase[MCPFrontEndConfig]):
28
+ """MCP front end plugin implementation."""
29
+
30
+ async def run(self) -> None:
31
+ """Run the MCP server."""
32
+ # Import FastMCP
33
+ from mcp.server.fastmcp import FastMCP
34
+
35
+ from aiq.front_ends.mcp.tool_converter import register_function_with_mcp
36
+
37
+ # Create an MCP server with the configured parameters
38
+ mcp = FastMCP(
39
+ self.front_end_config.name,
40
+ host=self.front_end_config.host,
41
+ port=self.front_end_config.port,
42
+ debug=self.front_end_config.debug,
43
+ log_level=self.front_end_config.log_level,
44
+ )
45
+
46
+ # Build the workflow and register all functions with MCP
47
+ async with WorkflowBuilder.from_config(config=self.full_config) as builder:
48
+ # Build the workflow
49
+ workflow = builder.build()
50
+
51
+ # Get all functions from the workflow
52
+ functions = self._get_all_functions(workflow)
53
+
54
+ # Filter functions based on tool_names if provided
55
+ if self.front_end_config.tool_names:
56
+ logger.info(f"Filtering functions based on tool_names: {self.front_end_config.tool_names}")
57
+ filtered_functions: dict[str, Function] = {}
58
+ for function_name, function in functions.items():
59
+ if function_name in self.front_end_config.tool_names:
60
+ filtered_functions[function_name] = function
61
+ else:
62
+ logger.debug(f"Skipping function {function_name} as it's not in tool_names")
63
+ functions = filtered_functions
64
+
65
+ # Register each function with MCP
66
+ for function_name, function in functions.items():
67
+ register_function_with_mcp(mcp, function_name, function)
68
+
69
+ # Add a simple fallback function if no functions were found
70
+ if not functions:
71
+ raise RuntimeError("No functions found in workflow. Please check your configuration.")
72
+
73
+ # Start the MCP server
74
+ await mcp.run_sse_async()
75
+
76
+ def _get_all_functions(self, workflow: Workflow) -> dict[str, Function]:
77
+ """Get all functions from the workflow.
78
+
79
+ Args:
80
+ workflow: The AIQ workflow.
81
+
82
+ Returns:
83
+ Dict mapping function names to Function objects.
84
+ """
85
+ functions: dict[str, Function] = {}
86
+
87
+ # Extract all functions from the workflow
88
+ for function_name, function in workflow.functions.items():
89
+ functions[function_name] = function
90
+
91
+ functions[workflow.config.workflow.type] = workflow
92
+
93
+ return functions
@@ -0,0 +1,27 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from collections.abc import AsyncIterator
17
+
18
+ from aiq.cli.register_workflow import register_front_end
19
+ from aiq.data_models.config import AIQConfig
20
+ from aiq.front_ends.mcp.mcp_front_end_config import MCPFrontEndConfig
21
+
22
+
23
+ @register_front_end(config_type=MCPFrontEndConfig)
24
+ async def register_mcp_front_end(config: MCPFrontEndConfig, full_config: AIQConfig) -> AsyncIterator:
25
+ from aiq.front_ends.mcp.mcp_front_end_plugin import MCPFrontEndPlugin
26
+
27
+ yield MCPFrontEndPlugin(full_config=full_config)