aiqtoolkit 1.1.0a20250429__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of aiqtoolkit might be problematic. Click here for more details.

Files changed (309) hide show
  1. aiq/agent/__init__.py +0 -0
  2. aiq/agent/base.py +76 -0
  3. aiq/agent/dual_node.py +67 -0
  4. aiq/agent/react_agent/__init__.py +0 -0
  5. aiq/agent/react_agent/agent.py +322 -0
  6. aiq/agent/react_agent/output_parser.py +104 -0
  7. aiq/agent/react_agent/prompt.py +46 -0
  8. aiq/agent/react_agent/register.py +148 -0
  9. aiq/agent/reasoning_agent/__init__.py +0 -0
  10. aiq/agent/reasoning_agent/reasoning_agent.py +224 -0
  11. aiq/agent/register.py +23 -0
  12. aiq/agent/rewoo_agent/__init__.py +0 -0
  13. aiq/agent/rewoo_agent/agent.py +410 -0
  14. aiq/agent/rewoo_agent/prompt.py +108 -0
  15. aiq/agent/rewoo_agent/register.py +158 -0
  16. aiq/agent/tool_calling_agent/__init__.py +0 -0
  17. aiq/agent/tool_calling_agent/agent.py +123 -0
  18. aiq/agent/tool_calling_agent/register.py +105 -0
  19. aiq/builder/__init__.py +0 -0
  20. aiq/builder/builder.py +223 -0
  21. aiq/builder/component_utils.py +303 -0
  22. aiq/builder/context.py +198 -0
  23. aiq/builder/embedder.py +24 -0
  24. aiq/builder/eval_builder.py +116 -0
  25. aiq/builder/evaluator.py +29 -0
  26. aiq/builder/framework_enum.py +24 -0
  27. aiq/builder/front_end.py +73 -0
  28. aiq/builder/function.py +297 -0
  29. aiq/builder/function_base.py +372 -0
  30. aiq/builder/function_info.py +627 -0
  31. aiq/builder/intermediate_step_manager.py +125 -0
  32. aiq/builder/llm.py +25 -0
  33. aiq/builder/retriever.py +25 -0
  34. aiq/builder/user_interaction_manager.py +71 -0
  35. aiq/builder/workflow.py +134 -0
  36. aiq/builder/workflow_builder.py +733 -0
  37. aiq/cli/__init__.py +14 -0
  38. aiq/cli/cli_utils/__init__.py +0 -0
  39. aiq/cli/cli_utils/config_override.py +233 -0
  40. aiq/cli/cli_utils/validation.py +37 -0
  41. aiq/cli/commands/__init__.py +0 -0
  42. aiq/cli/commands/configure/__init__.py +0 -0
  43. aiq/cli/commands/configure/channel/__init__.py +0 -0
  44. aiq/cli/commands/configure/channel/add.py +28 -0
  45. aiq/cli/commands/configure/channel/channel.py +34 -0
  46. aiq/cli/commands/configure/channel/remove.py +30 -0
  47. aiq/cli/commands/configure/channel/update.py +30 -0
  48. aiq/cli/commands/configure/configure.py +33 -0
  49. aiq/cli/commands/evaluate.py +139 -0
  50. aiq/cli/commands/info/__init__.py +14 -0
  51. aiq/cli/commands/info/info.py +37 -0
  52. aiq/cli/commands/info/list_channels.py +32 -0
  53. aiq/cli/commands/info/list_components.py +129 -0
  54. aiq/cli/commands/registry/__init__.py +14 -0
  55. aiq/cli/commands/registry/publish.py +88 -0
  56. aiq/cli/commands/registry/pull.py +118 -0
  57. aiq/cli/commands/registry/registry.py +36 -0
  58. aiq/cli/commands/registry/remove.py +108 -0
  59. aiq/cli/commands/registry/search.py +155 -0
  60. aiq/cli/commands/start.py +250 -0
  61. aiq/cli/commands/uninstall.py +83 -0
  62. aiq/cli/commands/validate.py +47 -0
  63. aiq/cli/commands/workflow/__init__.py +14 -0
  64. aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
  65. aiq/cli/commands/workflow/templates/config.yml.j2 +16 -0
  66. aiq/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
  67. aiq/cli/commands/workflow/templates/register.py.j2 +5 -0
  68. aiq/cli/commands/workflow/templates/workflow.py.j2 +36 -0
  69. aiq/cli/commands/workflow/workflow.py +37 -0
  70. aiq/cli/commands/workflow/workflow_commands.py +307 -0
  71. aiq/cli/entrypoint.py +133 -0
  72. aiq/cli/main.py +44 -0
  73. aiq/cli/register_workflow.py +408 -0
  74. aiq/cli/type_registry.py +869 -0
  75. aiq/data_models/__init__.py +14 -0
  76. aiq/data_models/api_server.py +550 -0
  77. aiq/data_models/common.py +143 -0
  78. aiq/data_models/component.py +46 -0
  79. aiq/data_models/component_ref.py +135 -0
  80. aiq/data_models/config.py +349 -0
  81. aiq/data_models/dataset_handler.py +122 -0
  82. aiq/data_models/discovery_metadata.py +269 -0
  83. aiq/data_models/embedder.py +26 -0
  84. aiq/data_models/evaluate.py +101 -0
  85. aiq/data_models/evaluator.py +26 -0
  86. aiq/data_models/front_end.py +26 -0
  87. aiq/data_models/function.py +30 -0
  88. aiq/data_models/function_dependencies.py +64 -0
  89. aiq/data_models/interactive.py +237 -0
  90. aiq/data_models/intermediate_step.py +269 -0
  91. aiq/data_models/invocation_node.py +38 -0
  92. aiq/data_models/llm.py +26 -0
  93. aiq/data_models/logging.py +26 -0
  94. aiq/data_models/memory.py +26 -0
  95. aiq/data_models/profiler.py +53 -0
  96. aiq/data_models/registry_handler.py +26 -0
  97. aiq/data_models/retriever.py +30 -0
  98. aiq/data_models/step_adaptor.py +64 -0
  99. aiq/data_models/streaming.py +33 -0
  100. aiq/data_models/swe_bench_model.py +54 -0
  101. aiq/data_models/telemetry_exporter.py +26 -0
  102. aiq/embedder/__init__.py +0 -0
  103. aiq/embedder/langchain_client.py +41 -0
  104. aiq/embedder/nim_embedder.py +58 -0
  105. aiq/embedder/openai_embedder.py +42 -0
  106. aiq/embedder/register.py +24 -0
  107. aiq/eval/__init__.py +14 -0
  108. aiq/eval/config.py +42 -0
  109. aiq/eval/dataset_handler/__init__.py +0 -0
  110. aiq/eval/dataset_handler/dataset_downloader.py +106 -0
  111. aiq/eval/dataset_handler/dataset_filter.py +52 -0
  112. aiq/eval/dataset_handler/dataset_handler.py +164 -0
  113. aiq/eval/evaluate.py +322 -0
  114. aiq/eval/evaluator/__init__.py +14 -0
  115. aiq/eval/evaluator/evaluator_model.py +44 -0
  116. aiq/eval/intermediate_step_adapter.py +93 -0
  117. aiq/eval/rag_evaluator/__init__.py +0 -0
  118. aiq/eval/rag_evaluator/evaluate.py +138 -0
  119. aiq/eval/rag_evaluator/register.py +138 -0
  120. aiq/eval/register.py +22 -0
  121. aiq/eval/remote_workflow.py +128 -0
  122. aiq/eval/runtime_event_subscriber.py +52 -0
  123. aiq/eval/swe_bench_evaluator/__init__.py +0 -0
  124. aiq/eval/swe_bench_evaluator/evaluate.py +215 -0
  125. aiq/eval/swe_bench_evaluator/register.py +36 -0
  126. aiq/eval/trajectory_evaluator/__init__.py +0 -0
  127. aiq/eval/trajectory_evaluator/evaluate.py +118 -0
  128. aiq/eval/trajectory_evaluator/register.py +40 -0
  129. aiq/eval/utils/__init__.py +0 -0
  130. aiq/eval/utils/output_uploader.py +131 -0
  131. aiq/eval/utils/tqdm_position_registry.py +40 -0
  132. aiq/front_ends/__init__.py +14 -0
  133. aiq/front_ends/console/__init__.py +14 -0
  134. aiq/front_ends/console/console_front_end_config.py +32 -0
  135. aiq/front_ends/console/console_front_end_plugin.py +107 -0
  136. aiq/front_ends/console/register.py +25 -0
  137. aiq/front_ends/cron/__init__.py +14 -0
  138. aiq/front_ends/fastapi/__init__.py +14 -0
  139. aiq/front_ends/fastapi/fastapi_front_end_config.py +150 -0
  140. aiq/front_ends/fastapi/fastapi_front_end_plugin.py +103 -0
  141. aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +574 -0
  142. aiq/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
  143. aiq/front_ends/fastapi/job_store.py +161 -0
  144. aiq/front_ends/fastapi/main.py +70 -0
  145. aiq/front_ends/fastapi/message_handler.py +279 -0
  146. aiq/front_ends/fastapi/message_validator.py +345 -0
  147. aiq/front_ends/fastapi/register.py +25 -0
  148. aiq/front_ends/fastapi/response_helpers.py +181 -0
  149. aiq/front_ends/fastapi/step_adaptor.py +315 -0
  150. aiq/front_ends/fastapi/websocket.py +148 -0
  151. aiq/front_ends/mcp/__init__.py +14 -0
  152. aiq/front_ends/mcp/mcp_front_end_config.py +32 -0
  153. aiq/front_ends/mcp/mcp_front_end_plugin.py +93 -0
  154. aiq/front_ends/mcp/register.py +27 -0
  155. aiq/front_ends/mcp/tool_converter.py +242 -0
  156. aiq/front_ends/register.py +22 -0
  157. aiq/front_ends/simple_base/__init__.py +14 -0
  158. aiq/front_ends/simple_base/simple_front_end_plugin_base.py +52 -0
  159. aiq/llm/__init__.py +0 -0
  160. aiq/llm/nim_llm.py +45 -0
  161. aiq/llm/openai_llm.py +45 -0
  162. aiq/llm/register.py +22 -0
  163. aiq/llm/utils/__init__.py +14 -0
  164. aiq/llm/utils/env_config_value.py +94 -0
  165. aiq/llm/utils/error.py +17 -0
  166. aiq/memory/__init__.py +20 -0
  167. aiq/memory/interfaces.py +183 -0
  168. aiq/memory/models.py +102 -0
  169. aiq/meta/module_to_distro.json +3 -0
  170. aiq/meta/pypi.md +59 -0
  171. aiq/observability/__init__.py +0 -0
  172. aiq/observability/async_otel_listener.py +270 -0
  173. aiq/observability/register.py +97 -0
  174. aiq/plugins/.namespace +1 -0
  175. aiq/profiler/__init__.py +0 -0
  176. aiq/profiler/callbacks/__init__.py +0 -0
  177. aiq/profiler/callbacks/agno_callback_handler.py +295 -0
  178. aiq/profiler/callbacks/base_callback_class.py +20 -0
  179. aiq/profiler/callbacks/langchain_callback_handler.py +278 -0
  180. aiq/profiler/callbacks/llama_index_callback_handler.py +205 -0
  181. aiq/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
  182. aiq/profiler/callbacks/token_usage_base_model.py +27 -0
  183. aiq/profiler/data_frame_row.py +51 -0
  184. aiq/profiler/decorators/__init__.py +0 -0
  185. aiq/profiler/decorators/framework_wrapper.py +131 -0
  186. aiq/profiler/decorators/function_tracking.py +254 -0
  187. aiq/profiler/forecasting/__init__.py +0 -0
  188. aiq/profiler/forecasting/config.py +18 -0
  189. aiq/profiler/forecasting/model_trainer.py +75 -0
  190. aiq/profiler/forecasting/models/__init__.py +22 -0
  191. aiq/profiler/forecasting/models/forecasting_base_model.py +40 -0
  192. aiq/profiler/forecasting/models/linear_model.py +196 -0
  193. aiq/profiler/forecasting/models/random_forest_regressor.py +268 -0
  194. aiq/profiler/inference_metrics_model.py +25 -0
  195. aiq/profiler/inference_optimization/__init__.py +0 -0
  196. aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
  197. aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +452 -0
  198. aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
  199. aiq/profiler/inference_optimization/data_models.py +386 -0
  200. aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
  201. aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
  202. aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
  203. aiq/profiler/inference_optimization/llm_metrics.py +212 -0
  204. aiq/profiler/inference_optimization/prompt_caching.py +163 -0
  205. aiq/profiler/inference_optimization/token_uniqueness.py +107 -0
  206. aiq/profiler/inference_optimization/workflow_runtimes.py +72 -0
  207. aiq/profiler/intermediate_property_adapter.py +102 -0
  208. aiq/profiler/profile_runner.py +433 -0
  209. aiq/profiler/utils.py +184 -0
  210. aiq/registry_handlers/__init__.py +0 -0
  211. aiq/registry_handlers/local/__init__.py +0 -0
  212. aiq/registry_handlers/local/local_handler.py +176 -0
  213. aiq/registry_handlers/local/register_local.py +37 -0
  214. aiq/registry_handlers/metadata_factory.py +60 -0
  215. aiq/registry_handlers/package_utils.py +198 -0
  216. aiq/registry_handlers/pypi/__init__.py +0 -0
  217. aiq/registry_handlers/pypi/pypi_handler.py +251 -0
  218. aiq/registry_handlers/pypi/register_pypi.py +40 -0
  219. aiq/registry_handlers/register.py +21 -0
  220. aiq/registry_handlers/registry_handler_base.py +157 -0
  221. aiq/registry_handlers/rest/__init__.py +0 -0
  222. aiq/registry_handlers/rest/register_rest.py +56 -0
  223. aiq/registry_handlers/rest/rest_handler.py +237 -0
  224. aiq/registry_handlers/schemas/__init__.py +0 -0
  225. aiq/registry_handlers/schemas/headers.py +42 -0
  226. aiq/registry_handlers/schemas/package.py +68 -0
  227. aiq/registry_handlers/schemas/publish.py +63 -0
  228. aiq/registry_handlers/schemas/pull.py +81 -0
  229. aiq/registry_handlers/schemas/remove.py +36 -0
  230. aiq/registry_handlers/schemas/search.py +91 -0
  231. aiq/registry_handlers/schemas/status.py +47 -0
  232. aiq/retriever/__init__.py +0 -0
  233. aiq/retriever/interface.py +37 -0
  234. aiq/retriever/milvus/__init__.py +14 -0
  235. aiq/retriever/milvus/register.py +81 -0
  236. aiq/retriever/milvus/retriever.py +228 -0
  237. aiq/retriever/models.py +74 -0
  238. aiq/retriever/nemo_retriever/__init__.py +14 -0
  239. aiq/retriever/nemo_retriever/register.py +60 -0
  240. aiq/retriever/nemo_retriever/retriever.py +190 -0
  241. aiq/retriever/register.py +22 -0
  242. aiq/runtime/__init__.py +14 -0
  243. aiq/runtime/loader.py +188 -0
  244. aiq/runtime/runner.py +176 -0
  245. aiq/runtime/session.py +116 -0
  246. aiq/settings/__init__.py +0 -0
  247. aiq/settings/global_settings.py +318 -0
  248. aiq/test/.namespace +1 -0
  249. aiq/tool/__init__.py +0 -0
  250. aiq/tool/code_execution/__init__.py +0 -0
  251. aiq/tool/code_execution/code_sandbox.py +188 -0
  252. aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
  253. aiq/tool/code_execution/local_sandbox/__init__.py +13 -0
  254. aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +79 -0
  255. aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +4 -0
  256. aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +25 -0
  257. aiq/tool/code_execution/register.py +70 -0
  258. aiq/tool/code_execution/utils.py +100 -0
  259. aiq/tool/datetime_tools.py +42 -0
  260. aiq/tool/document_search.py +141 -0
  261. aiq/tool/github_tools/__init__.py +0 -0
  262. aiq/tool/github_tools/create_github_commit.py +133 -0
  263. aiq/tool/github_tools/create_github_issue.py +87 -0
  264. aiq/tool/github_tools/create_github_pr.py +106 -0
  265. aiq/tool/github_tools/get_github_file.py +106 -0
  266. aiq/tool/github_tools/get_github_issue.py +166 -0
  267. aiq/tool/github_tools/get_github_pr.py +256 -0
  268. aiq/tool/github_tools/update_github_issue.py +100 -0
  269. aiq/tool/mcp/__init__.py +14 -0
  270. aiq/tool/mcp/mcp_client.py +220 -0
  271. aiq/tool/mcp/mcp_tool.py +75 -0
  272. aiq/tool/memory_tools/__init__.py +0 -0
  273. aiq/tool/memory_tools/add_memory_tool.py +67 -0
  274. aiq/tool/memory_tools/delete_memory_tool.py +67 -0
  275. aiq/tool/memory_tools/get_memory_tool.py +72 -0
  276. aiq/tool/nvidia_rag.py +95 -0
  277. aiq/tool/register.py +36 -0
  278. aiq/tool/retriever.py +89 -0
  279. aiq/utils/__init__.py +0 -0
  280. aiq/utils/data_models/__init__.py +0 -0
  281. aiq/utils/data_models/schema_validator.py +58 -0
  282. aiq/utils/debugging_utils.py +43 -0
  283. aiq/utils/exception_handlers/__init__.py +0 -0
  284. aiq/utils/exception_handlers/schemas.py +114 -0
  285. aiq/utils/io/__init__.py +0 -0
  286. aiq/utils/io/yaml_tools.py +50 -0
  287. aiq/utils/metadata_utils.py +74 -0
  288. aiq/utils/producer_consumer_queue.py +178 -0
  289. aiq/utils/reactive/__init__.py +0 -0
  290. aiq/utils/reactive/base/__init__.py +0 -0
  291. aiq/utils/reactive/base/observable_base.py +65 -0
  292. aiq/utils/reactive/base/observer_base.py +55 -0
  293. aiq/utils/reactive/base/subject_base.py +79 -0
  294. aiq/utils/reactive/observable.py +59 -0
  295. aiq/utils/reactive/observer.py +76 -0
  296. aiq/utils/reactive/subject.py +131 -0
  297. aiq/utils/reactive/subscription.py +49 -0
  298. aiq/utils/settings/__init__.py +0 -0
  299. aiq/utils/settings/global_settings.py +197 -0
  300. aiq/utils/type_converter.py +232 -0
  301. aiq/utils/type_utils.py +397 -0
  302. aiq/utils/url_utils.py +27 -0
  303. aiqtoolkit-1.1.0a20250429.dist-info/METADATA +326 -0
  304. aiqtoolkit-1.1.0a20250429.dist-info/RECORD +309 -0
  305. aiqtoolkit-1.1.0a20250429.dist-info/WHEEL +5 -0
  306. aiqtoolkit-1.1.0a20250429.dist-info/entry_points.txt +17 -0
  307. aiqtoolkit-1.1.0a20250429.dist-info/licenses/LICENSE-3rd-party.txt +3686 -0
  308. aiqtoolkit-1.1.0a20250429.dist-info/licenses/LICENSE.md +201 -0
  309. aiqtoolkit-1.1.0a20250429.dist-info/top_level.txt +1 -0
@@ -0,0 +1,183 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from abc import ABC
17
+ from abc import abstractmethod
18
+ from collections.abc import Callable
19
+
20
+ from .models import MemoryItem
21
+
22
+
23
+ class MemoryEditor(ABC):
24
+ """
25
+ Abstract interface for editing and
26
+ retrieving memory items.
27
+
28
+ A MemoryEditor is responsible for adding, searching, and
29
+ removing MemoryItems.
30
+
31
+ Implementations may integrate with
32
+ vector stores or other indexing backends.
33
+ """
34
+
35
+ @abstractmethod
36
+ async def add_items(self, items: list[MemoryItem]) -> None:
37
+ """
38
+ Insert multiple MemoryItems into the memory.
39
+
40
+ Args:
41
+ items (list[MemoryItem]): The items to be added.
42
+ """
43
+ raise NotImplementedError
44
+
45
+ @abstractmethod
46
+ async def search(self, query: str, top_k: int = 5, **kwargs) -> list[MemoryItem]:
47
+ """
48
+ Retrieve items relevant to the given query.
49
+ Relevance criteria depend on implementation.
50
+
51
+ Args:
52
+ query (str): The query string to match.
53
+ top_k (int): Maximum number of items to return.
54
+ kwargs (dict): Keyword arguments to pass to the search method.
55
+
56
+ Returns:
57
+ list[MemoryItem]: The most relevant MemoryItems.
58
+ """
59
+ raise NotImplementedError
60
+
61
+ @abstractmethod
62
+ async def remove_items(self, **kwargs) -> None:
63
+ """
64
+ Remove items. Additional parameters
65
+ needed for deletion can be specified in keyword arguments.
66
+
67
+ Args:
68
+ kwargs (dict): Keyword arguments to pass to the remove-items method.
69
+ """
70
+ raise NotImplementedError
71
+
72
+
73
+ class MemoryIOBase(ABC):
74
+ """
75
+ Base abstract class for I/O operations
76
+ on memory, providing a common interface for
77
+
78
+ MemoryReader and MemoryWriter to interact
79
+ with a MemoryEditor.
80
+
81
+ Concrete subclasses should hold a
82
+ reference to a MemoryEditor instance.
83
+ """
84
+
85
+ def __init__(self, editor: MemoryEditor) -> None:
86
+ self._editor = editor
87
+
88
+
89
+ class MemoryReader(MemoryIOBase):
90
+ """
91
+ Responsible for retrieving MemoryItems
92
+ from the MemoryEditor based on context or queries.
93
+ """
94
+
95
+ @abstractmethod
96
+ async def retrieve(self, context: str, top_k: int = 5) -> list[MemoryItem]:
97
+ """
98
+ Retrieve a subset of
99
+ MemoryItems relevant to the provided context.
100
+
101
+ Args:
102
+ context (str): A string representing
103
+ the current user context or query.
104
+ top_k (int): Maximum number of items to return.
105
+
106
+ Returns:
107
+ list[MemoryItem]: Relevant MemoryItems.
108
+ """
109
+ raise NotImplementedError
110
+
111
+
112
+ class MemoryWriter(MemoryIOBase):
113
+ """
114
+ Responsible for converting new observations
115
+ (textual inputs) into MemoryItems andstoring
116
+ them via the MemoryEditor.
117
+ """
118
+
119
+ @abstractmethod
120
+ async def write(self, observation: str, context: str | None = None) -> list[MemoryItem]:
121
+ """
122
+ Process the given observation and store the resulting MemoryItems.
123
+
124
+ Args:
125
+ observation (str): The new textual input to record.
126
+ context (Optional[str]): Additional
127
+ context that might influence how the observation is stored.
128
+
129
+ Returns:
130
+ list[MemoryItem]: The newly created MemoryItems.
131
+ """
132
+ raise NotImplementedError
133
+
134
+
135
+ class MemoryManager(ABC):
136
+ """
137
+ Manages the lifecycle of the stored
138
+ memory by applying policies such as summarization,
139
+ reflection, forgetting, and mergingn
140
+ to ensure long-term coherence and relevance.
141
+ """
142
+
143
+ @abstractmethod
144
+ async def summarize(self) -> None:
145
+ """
146
+ Summarize long or numerous MemoryItems into a more compact form.
147
+ This may remove the original items and store a new summary item.
148
+ """
149
+ raise NotImplementedError
150
+
151
+ @abstractmethod
152
+ async def reflect(self) -> None:
153
+ """
154
+ Generate higher-level insights or
155
+ abstractions from existing MemoryItems.
156
+ This may call out to an LLM or other
157
+ logic to produce conceptual memory.
158
+ """
159
+ raise NotImplementedError
160
+
161
+ @abstractmethod
162
+ async def forget(self, criteria: Callable[[MemoryItem], bool]) -> None:
163
+ """
164
+ Remove MemoryItems that are no
165
+ longer relevant or have low importance.
166
+
167
+ Args:
168
+ criteria (Callable[[MemoryItem], bool]): A function that
169
+ returns True for items to forget.
170
+ """
171
+ raise NotImplementedError
172
+
173
+ @abstractmethod
174
+ async def merge(self, criteria: Callable[[MemoryItem, MemoryItem], bool]) -> None:
175
+ """
176
+ Merge similar or redundant MemoryItems
177
+ into a smaller set of more concise items.
178
+
179
+ Args:
180
+ criteria (Callable[[MemoryItem, MemoryItem], bool]): A function
181
+ that determines which items can be merged.
182
+ """
183
+ raise NotImplementedError
aiq/memory/models.py ADDED
@@ -0,0 +1,102 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import typing
17
+
18
+ from pydantic import BaseModel
19
+ from pydantic import ConfigDict
20
+ from pydantic import Field
21
+
22
+
23
+ class MemoryItem(BaseModel):
24
+ """
25
+ Represents a single memory item consisting of structured content and associated metadata.
26
+
27
+ Attributes
28
+ ----------
29
+ conversation : list[dict[str, str]]
30
+ A list of dictionaries, each containing string key-value pairs.
31
+ user_id : str
32
+ Unique identifier for this MemoryItem's user.
33
+ tags : list[str]
34
+ A list of strings representing tags attached to the item.
35
+ metadata : dict[str, typing.Any]
36
+ Metadata providing context and utility for management operations.
37
+ memory : str or None
38
+ Optional memory string. Helpful when returning a memory.
39
+ """
40
+ model_config = ConfigDict(
41
+ # Add an example for the schema
42
+ json_schema_extra={
43
+ "examples": [{
44
+ "conversation": [
45
+ {
46
+ "role": "user",
47
+ "content": "Hi, I'm Alex. I'm a vegetarian and I'm allergic to nuts.",
48
+ },
49
+ {
50
+ "role": "assistant",
51
+ "content": "Hello Alex! I've noted that you're a vegetarian and have a nut allergy.",
52
+ },
53
+ ],
54
+ "user_id": "user_abc",
55
+ "metadata": {
56
+ "key_value_pairs": {
57
+ "type": "technology", "relevance": "high"
58
+ }
59
+ }
60
+ }]
61
+ },
62
+ # Allow population of models from arbitrary types (e.g., ORM objects)
63
+ arbitrary_types_allowed=True,
64
+ # Enable aliasing if needed
65
+ populate_by_name=True)
66
+
67
+ conversation: list[dict[str, str]] = Field(description="List of conversation messages. "
68
+ "Each message must have a \"role\" "
69
+ "key (user or assistant. It must "
70
+ "als have a \"content\" key.")
71
+ tags: list[str] = Field(default_factory=list, description="List of tags applied to the item.")
72
+ metadata: dict[str, typing.Any] = Field(description="Metadata about the memory item.")
73
+ user_id: str = Field(description="The user's ID.")
74
+ memory: str | None = Field(default=None)
75
+
76
+
77
+ class SearchMemoryInput(BaseModel):
78
+ """
79
+ Represents a search memory input structure.
80
+ """
81
+ model_config = ConfigDict(json_schema_extra={
82
+ "example": {
83
+ "query": "What is the user's preferred programming language?",
84
+ "top_k": 1,
85
+ "user_id": "user_abc",
86
+ }
87
+ })
88
+
89
+ query: str = Field(description="Search query for which to retrieve memory.") # noqa: E501
90
+ top_k: int = Field(description="Maximum number of memories to return")
91
+ user_id: str = Field(description="ID of the user to search for.")
92
+
93
+
94
+ class DeleteMemoryInput(BaseModel):
95
+ """
96
+ Represents a delete memory input structure.
97
+ """
98
+ model_config = ConfigDict(json_schema_extra={"example": {"user_id": "user_abc", }})
99
+
100
+ user_id: str = Field(description="ID of the user to delete memory for. Careful when using "
101
+ "this tool; make sure you use the "
102
+ "username present in the conversation.")
@@ -0,0 +1,3 @@
1
+ {
2
+ "aiq": "aiqtoolkit"
3
+ }
aiq/meta/pypi.md ADDED
@@ -0,0 +1,59 @@
1
+ <!--
2
+ SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
3
+ SPDX-License-Identifier: Apache-2.0
4
+
5
+ Licensed under the Apache License, Version 2.0 (the "License");
6
+ you may not use this file except in compliance with the License.
7
+ You may obtain a copy of the License at
8
+
9
+ http:/www.apache.org/licenses/LICENSE-2.0
10
+
11
+ Unless required by applicable law or agreed to in writing, software
12
+ distributed under the License is distributed on an "AS IS" BASIS,
13
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
+ See the License for the specific language governing permissions and
15
+ limitations under the License.
16
+ -->
17
+
18
+ ![NVIDIA AgentIQ](https://media.githubusercontent.com/media/NVIDIA/AgentIQ/refs/heads/main/docs/source/_static/agentiq_banner.png "AgentIQ banner image")
19
+
20
+ # NVIDIA AgentIQ
21
+
22
+ AgentIQ is a flexible library designed to seamlessly integrate your enterprise agents—regardless of framework—with various data sources and tools. By treating agents, tools, and agentic workflows as simple function calls, AgentIQ enables true composability: build once and reuse anywhere.
23
+
24
+ ## Key Features
25
+
26
+ - [**Framework Agnostic:**](https://docs.nvidia.com/agentiq/latest/concepts/plugins.html) Works with any agentic framework, so you can use your current technology stack without replatforming.
27
+ - [**Reusability:**](https://docs.nvidia.com/agentiq/latest/guides/sharing-workflows-and-tools.html) Every agent, tool, or workflow can be combined and repurposed, allowing developers to leverage existing work in new scenarios.
28
+ - [**Rapid Development:**](https://docs.nvidia.com/agentiq/latest/guides/create-customize-workflows.html) Start with a pre-built agent, tool, or workflow, and customize it to your needs.
29
+ - [**Profiling:**](https://docs.nvidia.com/agentiq/latest/guides/profiler.html) Profile entire workflows down to the tool and agent level, track input/output tokens and timings, and identify bottlenecks.
30
+ - [**Observability:**](https://docs.nvidia.com/agentiq/latest/guides/observe-workflow-with-phoenix.html) Monitor and debug your workflows with any OpenTelemetry-compatible observability tool.
31
+ - [**Evaluation System:**](https://docs.nvidia.com/agentiq/latest/guides/evaluate.html) Validate and maintain accuracy of agentic workflows with built-in evaluation tools.
32
+ - [**User Interface:**](https://docs.nvidia.com/agentiq/latest/guides/using-agentiq-ui-and-server.html) Use the AgentIQ UI chat interface to interact with your agents, visualize output, and debug workflows.
33
+ - [**MCP Compatibility**](https://docs.nvidia.com/agentiq/latest/components/mcp.html) Compatible with Model Context Protocol (MCP), allowing tools served by MCP Servers to be used as AgentIQ functions.
34
+
35
+ With AgentIQ, you can move quickly, experiment freely, and ensure reliability across all your agent-driven projects.
36
+
37
+ ## Links
38
+ * [Documentation](https://docs.nvidia.com/agentiq/latest/index.html): Explore the full documentation for AgentIQ.
39
+ * [About AgentIQ](https://docs.nvidia.com/agentiq/latest/intro/why-agentiq.html): Learn more about the benefits of using AgentIQ.
40
+
41
+ ## First time user?
42
+ If this is your first time using AgentIQ, it is recommended to install the latest version from the [source repository](https://github.com/NVIDIA/AgentIQ?tab=readme-ov-file#get-started) on GitHub. This package is intended for users who are familiar with AgentIQ applications and need to add AgentIQ as a dependency to their project.
43
+
44
+ ## Feedback
45
+
46
+ We would love to hear from you! Please file an issue on [GitHub](https://github.com/NVIDIA/AgentIQ/issues) if you have any feedback or feature requests.
47
+
48
+ ## Acknowledgements
49
+
50
+ We would like to thank the following open source projects that made AgentIQ possible:
51
+
52
+ - [CrewAI](https://github.com/crewAIInc/crewAI)
53
+ - [FastAPI](https://github.com/tiangolo/fastapi)
54
+ - [LangChain](https://github.com/langchain-ai/langchain)
55
+ - [Llama-Index](https://github.com/run-llama/llama_index)
56
+ - [Mem0ai](https://github.com/mem0ai/mem0)
57
+ - [Ragas](https://github.com/explodinggradients/ragas)
58
+ - [Semantic Kernel](https://github.com/microsoft/semantic-kernel)
59
+ - [uv](https://github.com/astral-sh/uv)
File without changes
@@ -0,0 +1,270 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import logging
17
+ import re
18
+ from contextlib import asynccontextmanager
19
+ from typing import Any
20
+
21
+ from openinference.semconv.trace import OpenInferenceSpanKindValues
22
+ from openinference.semconv.trace import SpanAttributes
23
+ from opentelemetry import trace
24
+ from opentelemetry.sdk.trace import TracerProvider
25
+ from opentelemetry.trace import Span
26
+ from opentelemetry.trace.propagation import set_span_in_context
27
+ from pydantic import TypeAdapter
28
+
29
+ from aiq.builder.context import AIQContextState
30
+ from aiq.data_models.intermediate_step import IntermediateStep
31
+ from aiq.data_models.intermediate_step import IntermediateStepState
32
+
33
+ logger = logging.getLogger(__name__)
34
+
35
+ OPENINFERENCE_SPAN_KIND = SpanAttributes.OPENINFERENCE_SPAN_KIND
36
+
37
+
38
+ def _ns_timestamp(seconds_float: float) -> int:
39
+ """
40
+ Convert AgentIQ’s float `event_timestamp` (in seconds) into an integer number
41
+ of nanoseconds, as OpenTelemetry expects.
42
+ """
43
+ return int(seconds_float * 1e9)
44
+
45
+
46
+ class AsyncOtelSpanListener:
47
+ """
48
+ A separate, async class that listens to the AgentIQ intermediate step
49
+ event stream and creates proper Otel spans:
50
+
51
+ - On FUNCTION_START => open a new top-level span
52
+ - On any other intermediate step => open a child subspan (immediate open/close)
53
+ - On FUNCTION_END => close the function’s top-level span
54
+
55
+ This runs fully independently from the normal AgentIQ workflow, so that
56
+ the workflow is not blocking or entangled by OTel calls.
57
+ """
58
+
59
+ def __init__(self, context_state: AIQContextState | None = None):
60
+ """
61
+ :param context_state: Optionally supply a specific AIQContextState.
62
+ If None, uses the global singleton.
63
+ """
64
+ self._context_state = context_state or AIQContextState.get()
65
+
66
+ # Maintain a subscription so we can unsubscribe on shutdown
67
+ self._subscription = None
68
+
69
+ # Outstanding spans which have been opened but not yet closed
70
+ self._outstanding_spans: dict[str, Span] = {}
71
+
72
+ # Stack of spans, for when we need to create a child span
73
+ self._span_stack: list[Span] = []
74
+
75
+ self._running = False
76
+
77
+ # Prepare the tracer (optionally you might already have done this)
78
+ if trace.get_tracer_provider() is None or not isinstance(trace.get_tracer_provider(), TracerProvider):
79
+ tracer_provider = TracerProvider()
80
+ trace.set_tracer_provider(tracer_provider)
81
+
82
+ # We’ll optionally attach exporters if you want (out of scope to do it here).
83
+ # Example: tracer_provider.add_span_processor(BatchSpanProcessor(your_exporter))
84
+
85
+ self._tracer = trace.get_tracer("aiq-async-otel-listener")
86
+
87
+ def _on_next(self, step: IntermediateStep) -> None:
88
+ """
89
+ The main logic that reacts to each IntermediateStep.
90
+ """
91
+ if (step.event_state == IntermediateStepState.START):
92
+
93
+ self._process_start_event(step)
94
+
95
+ elif (step.event_state == IntermediateStepState.END):
96
+
97
+ self._process_end_event(step)
98
+
99
+ def _on_error(self, exc: Exception) -> None:
100
+ logger.error("Error in intermediate step subscription: %s", exc, exc_info=True)
101
+
102
+ def _on_complete(self) -> None:
103
+ logger.debug("Intermediate step stream completed. No more events will arrive.")
104
+
105
+ @asynccontextmanager
106
+ async def start(self):
107
+ """
108
+ Usage::
109
+
110
+ otel_listener = AsyncOtelSpanListener()
111
+ async with otel_listener.start():
112
+ # run your AgentIQ workflow
113
+ ...
114
+ # cleans up
115
+
116
+ This sets up the subscription to the AgentIQ event stream and starts the background loop.
117
+ """
118
+ try:
119
+ # Subscribe to the event stream
120
+ subject = self._context_state.event_stream.get()
121
+ self._subscription = subject.subscribe(
122
+ on_next=self._on_next,
123
+ on_error=self._on_error,
124
+ on_complete=self._on_complete,
125
+ )
126
+
127
+ self._running = True
128
+
129
+ yield # let the caller do their workflow
130
+
131
+ finally:
132
+ # Cleanup
133
+ self._running = False
134
+ # Close out any running spans
135
+ await self._cleanup()
136
+
137
+ if self._subscription:
138
+ self._subscription.unsubscribe()
139
+ self._subscription = None
140
+
141
+ async def _cleanup(self):
142
+ """
143
+ Close any remaining open spans.
144
+ """
145
+ if self._outstanding_spans:
146
+ logger.warning(
147
+ "Not all spans were closed. Ensure all start events have a corresponding end event. Remaining: %s",
148
+ self._outstanding_spans)
149
+
150
+ for span_info in self._outstanding_spans.values():
151
+ span_info.end()
152
+
153
+ self._outstanding_spans.clear()
154
+
155
+ if self._span_stack:
156
+ logger.error(
157
+ "Not all spans were closed. Ensure all start events have a corresponding end event. Remaining: %s",
158
+ self._span_stack)
159
+
160
+ self._span_stack.clear()
161
+
162
+ def _serialize_payload(self, input_value: Any) -> tuple[str, bool]:
163
+ """
164
+ Serialize the input value to a string. Returns a tuple with the serialized value and a boolean indicating if the
165
+ serialization is JSON or a string
166
+ """
167
+ try:
168
+ return TypeAdapter(type(input_value)).dump_json(input_value).decode('utf-8'), True
169
+ except Exception:
170
+ # Fallback to string representation if we can't serialize using pydantic
171
+ return str(input_value), False
172
+
173
+ def _process_start_event(self, step: IntermediateStep):
174
+
175
+ parent_ctx = None
176
+
177
+ if (len(self._span_stack) > 0):
178
+ parent_span = self._span_stack[-1]
179
+
180
+ parent_ctx = set_span_in_context(parent_span)
181
+
182
+ # Extract start/end times from the step
183
+ # By convention, `span_event_timestamp` is the time we started, `event_timestamp` is the time we ended.
184
+ # If span_event_timestamp is missing, we default to event_timestamp (meaning zero-length).
185
+ s_ts = step.payload.span_event_timestamp or step.payload.event_timestamp
186
+ start_ns = _ns_timestamp(s_ts)
187
+
188
+ # Optional: embed the LLM/tool name if present
189
+ if step.payload.name:
190
+ sub_span_name = f"{step.payload.name}"
191
+ else:
192
+ sub_span_name = f"{step.payload.event_type}"
193
+
194
+ # Start the subspan
195
+ sub_span = self._tracer.start_span(
196
+ name=sub_span_name,
197
+ context=parent_ctx,
198
+ attributes={
199
+ "aiq.event_type": step.payload.event_type.value,
200
+ "aiq.function.id": step.function_ancestry.function_id,
201
+ "aiq.function.name": step.function_ancestry.function_name,
202
+ "aiq.subspan.name": step.payload.name or "",
203
+ "aiq.event_timestamp": step.event_timestamp,
204
+ "aiq.framework": step.payload.framework.value if step.payload.framework else "unknown",
205
+ },
206
+ start_time=start_ns,
207
+ )
208
+
209
+ event_type_to_span_kind = {
210
+ "LLM_START": OpenInferenceSpanKindValues.LLM,
211
+ "LLM_END": OpenInferenceSpanKindValues.LLM,
212
+ "LLM_NEW_TOKEN": OpenInferenceSpanKindValues.LLM,
213
+ "TOOL_START": OpenInferenceSpanKindValues.TOOL,
214
+ "TOOL_END": OpenInferenceSpanKindValues.TOOL,
215
+ "FUNCTION_START": OpenInferenceSpanKindValues.CHAIN,
216
+ "FUNCTION_END": OpenInferenceSpanKindValues.CHAIN,
217
+ }
218
+
219
+ span_kind = event_type_to_span_kind.get(step.event_type, OpenInferenceSpanKindValues.UNKNOWN)
220
+ sub_span.set_attribute(SpanAttributes.OPENINFERENCE_SPAN_KIND, span_kind.value)
221
+
222
+ if step.payload.data and step.payload.data.input:
223
+ # optional parse
224
+ match = re.search(r"Human:\s*Question:\s*(.*)", str(step.payload.data.input))
225
+ if match:
226
+ human_question = match.group(1).strip()
227
+ sub_span.set_attribute(SpanAttributes.INPUT_VALUE, human_question)
228
+ else:
229
+ serialized_input, is_json = self._serialize_payload(step.payload.data.input)
230
+ sub_span.set_attribute(SpanAttributes.INPUT_VALUE, serialized_input)
231
+ sub_span.set_attribute(SpanAttributes.INPUT_MIME_TYPE, "application/json" if is_json else "text/plain")
232
+
233
+ self._span_stack.append(sub_span)
234
+
235
+ self._outstanding_spans[step.UUID] = sub_span
236
+
237
+ def _process_end_event(self, step: IntermediateStep):
238
+
239
+ # Find the subspan that was created in the start event
240
+ sub_span = self._outstanding_spans.pop(step.UUID, None)
241
+
242
+ if sub_span is None:
243
+ logger.warning("No subspan found for step %s", step.UUID)
244
+ return
245
+
246
+ self._span_stack.pop()
247
+
248
+ # Optionally add more attributes from usage_info or data
249
+ usage_info = step.payload.usage_info
250
+ if usage_info:
251
+ sub_span.set_attribute("aiq.usage.num_llm_calls",
252
+ usage_info.num_llm_calls if usage_info.num_llm_calls else 0)
253
+ sub_span.set_attribute("aiq.usage.seconds_between_calls",
254
+ usage_info.seconds_between_calls if usage_info.seconds_between_calls else 0)
255
+ sub_span.set_attribute(SpanAttributes.LLM_TOKEN_COUNT_PROMPT,
256
+ usage_info.token_usage.prompt_tokens if usage_info.token_usage else 0)
257
+ sub_span.set_attribute(SpanAttributes.LLM_TOKEN_COUNT_COMPLETION,
258
+ usage_info.token_usage.completion_tokens if usage_info.token_usage else 0)
259
+ sub_span.set_attribute(SpanAttributes.LLM_TOKEN_COUNT_TOTAL,
260
+ usage_info.token_usage.total_tokens if usage_info.token_usage else 0)
261
+
262
+ if step.payload.data and step.payload.data.output is not None:
263
+ serialized_output, is_json = self._serialize_payload(step.payload.data.output)
264
+ sub_span.set_attribute(SpanAttributes.OUTPUT_VALUE, serialized_output)
265
+ sub_span.set_attribute(SpanAttributes.OUTPUT_MIME_TYPE, "application/json" if is_json else "text/plain")
266
+
267
+ end_ns = _ns_timestamp(step.payload.event_timestamp)
268
+
269
+ # End the subspan
270
+ sub_span.end(end_time=end_ns)