aiqtoolkit 1.1.0a20250429__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of aiqtoolkit might be problematic. Click here for more details.
- aiq/agent/__init__.py +0 -0
- aiq/agent/base.py +76 -0
- aiq/agent/dual_node.py +67 -0
- aiq/agent/react_agent/__init__.py +0 -0
- aiq/agent/react_agent/agent.py +322 -0
- aiq/agent/react_agent/output_parser.py +104 -0
- aiq/agent/react_agent/prompt.py +46 -0
- aiq/agent/react_agent/register.py +148 -0
- aiq/agent/reasoning_agent/__init__.py +0 -0
- aiq/agent/reasoning_agent/reasoning_agent.py +224 -0
- aiq/agent/register.py +23 -0
- aiq/agent/rewoo_agent/__init__.py +0 -0
- aiq/agent/rewoo_agent/agent.py +410 -0
- aiq/agent/rewoo_agent/prompt.py +108 -0
- aiq/agent/rewoo_agent/register.py +158 -0
- aiq/agent/tool_calling_agent/__init__.py +0 -0
- aiq/agent/tool_calling_agent/agent.py +123 -0
- aiq/agent/tool_calling_agent/register.py +105 -0
- aiq/builder/__init__.py +0 -0
- aiq/builder/builder.py +223 -0
- aiq/builder/component_utils.py +303 -0
- aiq/builder/context.py +198 -0
- aiq/builder/embedder.py +24 -0
- aiq/builder/eval_builder.py +116 -0
- aiq/builder/evaluator.py +29 -0
- aiq/builder/framework_enum.py +24 -0
- aiq/builder/front_end.py +73 -0
- aiq/builder/function.py +297 -0
- aiq/builder/function_base.py +372 -0
- aiq/builder/function_info.py +627 -0
- aiq/builder/intermediate_step_manager.py +125 -0
- aiq/builder/llm.py +25 -0
- aiq/builder/retriever.py +25 -0
- aiq/builder/user_interaction_manager.py +71 -0
- aiq/builder/workflow.py +134 -0
- aiq/builder/workflow_builder.py +733 -0
- aiq/cli/__init__.py +14 -0
- aiq/cli/cli_utils/__init__.py +0 -0
- aiq/cli/cli_utils/config_override.py +233 -0
- aiq/cli/cli_utils/validation.py +37 -0
- aiq/cli/commands/__init__.py +0 -0
- aiq/cli/commands/configure/__init__.py +0 -0
- aiq/cli/commands/configure/channel/__init__.py +0 -0
- aiq/cli/commands/configure/channel/add.py +28 -0
- aiq/cli/commands/configure/channel/channel.py +34 -0
- aiq/cli/commands/configure/channel/remove.py +30 -0
- aiq/cli/commands/configure/channel/update.py +30 -0
- aiq/cli/commands/configure/configure.py +33 -0
- aiq/cli/commands/evaluate.py +139 -0
- aiq/cli/commands/info/__init__.py +14 -0
- aiq/cli/commands/info/info.py +37 -0
- aiq/cli/commands/info/list_channels.py +32 -0
- aiq/cli/commands/info/list_components.py +129 -0
- aiq/cli/commands/registry/__init__.py +14 -0
- aiq/cli/commands/registry/publish.py +88 -0
- aiq/cli/commands/registry/pull.py +118 -0
- aiq/cli/commands/registry/registry.py +36 -0
- aiq/cli/commands/registry/remove.py +108 -0
- aiq/cli/commands/registry/search.py +155 -0
- aiq/cli/commands/start.py +250 -0
- aiq/cli/commands/uninstall.py +83 -0
- aiq/cli/commands/validate.py +47 -0
- aiq/cli/commands/workflow/__init__.py +14 -0
- aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
- aiq/cli/commands/workflow/templates/config.yml.j2 +16 -0
- aiq/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
- aiq/cli/commands/workflow/templates/register.py.j2 +5 -0
- aiq/cli/commands/workflow/templates/workflow.py.j2 +36 -0
- aiq/cli/commands/workflow/workflow.py +37 -0
- aiq/cli/commands/workflow/workflow_commands.py +307 -0
- aiq/cli/entrypoint.py +133 -0
- aiq/cli/main.py +44 -0
- aiq/cli/register_workflow.py +408 -0
- aiq/cli/type_registry.py +869 -0
- aiq/data_models/__init__.py +14 -0
- aiq/data_models/api_server.py +550 -0
- aiq/data_models/common.py +143 -0
- aiq/data_models/component.py +46 -0
- aiq/data_models/component_ref.py +135 -0
- aiq/data_models/config.py +349 -0
- aiq/data_models/dataset_handler.py +122 -0
- aiq/data_models/discovery_metadata.py +269 -0
- aiq/data_models/embedder.py +26 -0
- aiq/data_models/evaluate.py +101 -0
- aiq/data_models/evaluator.py +26 -0
- aiq/data_models/front_end.py +26 -0
- aiq/data_models/function.py +30 -0
- aiq/data_models/function_dependencies.py +64 -0
- aiq/data_models/interactive.py +237 -0
- aiq/data_models/intermediate_step.py +269 -0
- aiq/data_models/invocation_node.py +38 -0
- aiq/data_models/llm.py +26 -0
- aiq/data_models/logging.py +26 -0
- aiq/data_models/memory.py +26 -0
- aiq/data_models/profiler.py +53 -0
- aiq/data_models/registry_handler.py +26 -0
- aiq/data_models/retriever.py +30 -0
- aiq/data_models/step_adaptor.py +64 -0
- aiq/data_models/streaming.py +33 -0
- aiq/data_models/swe_bench_model.py +54 -0
- aiq/data_models/telemetry_exporter.py +26 -0
- aiq/embedder/__init__.py +0 -0
- aiq/embedder/langchain_client.py +41 -0
- aiq/embedder/nim_embedder.py +58 -0
- aiq/embedder/openai_embedder.py +42 -0
- aiq/embedder/register.py +24 -0
- aiq/eval/__init__.py +14 -0
- aiq/eval/config.py +42 -0
- aiq/eval/dataset_handler/__init__.py +0 -0
- aiq/eval/dataset_handler/dataset_downloader.py +106 -0
- aiq/eval/dataset_handler/dataset_filter.py +52 -0
- aiq/eval/dataset_handler/dataset_handler.py +164 -0
- aiq/eval/evaluate.py +322 -0
- aiq/eval/evaluator/__init__.py +14 -0
- aiq/eval/evaluator/evaluator_model.py +44 -0
- aiq/eval/intermediate_step_adapter.py +93 -0
- aiq/eval/rag_evaluator/__init__.py +0 -0
- aiq/eval/rag_evaluator/evaluate.py +138 -0
- aiq/eval/rag_evaluator/register.py +138 -0
- aiq/eval/register.py +22 -0
- aiq/eval/remote_workflow.py +128 -0
- aiq/eval/runtime_event_subscriber.py +52 -0
- aiq/eval/swe_bench_evaluator/__init__.py +0 -0
- aiq/eval/swe_bench_evaluator/evaluate.py +215 -0
- aiq/eval/swe_bench_evaluator/register.py +36 -0
- aiq/eval/trajectory_evaluator/__init__.py +0 -0
- aiq/eval/trajectory_evaluator/evaluate.py +118 -0
- aiq/eval/trajectory_evaluator/register.py +40 -0
- aiq/eval/utils/__init__.py +0 -0
- aiq/eval/utils/output_uploader.py +131 -0
- aiq/eval/utils/tqdm_position_registry.py +40 -0
- aiq/front_ends/__init__.py +14 -0
- aiq/front_ends/console/__init__.py +14 -0
- aiq/front_ends/console/console_front_end_config.py +32 -0
- aiq/front_ends/console/console_front_end_plugin.py +107 -0
- aiq/front_ends/console/register.py +25 -0
- aiq/front_ends/cron/__init__.py +14 -0
- aiq/front_ends/fastapi/__init__.py +14 -0
- aiq/front_ends/fastapi/fastapi_front_end_config.py +150 -0
- aiq/front_ends/fastapi/fastapi_front_end_plugin.py +103 -0
- aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +574 -0
- aiq/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
- aiq/front_ends/fastapi/job_store.py +161 -0
- aiq/front_ends/fastapi/main.py +70 -0
- aiq/front_ends/fastapi/message_handler.py +279 -0
- aiq/front_ends/fastapi/message_validator.py +345 -0
- aiq/front_ends/fastapi/register.py +25 -0
- aiq/front_ends/fastapi/response_helpers.py +181 -0
- aiq/front_ends/fastapi/step_adaptor.py +315 -0
- aiq/front_ends/fastapi/websocket.py +148 -0
- aiq/front_ends/mcp/__init__.py +14 -0
- aiq/front_ends/mcp/mcp_front_end_config.py +32 -0
- aiq/front_ends/mcp/mcp_front_end_plugin.py +93 -0
- aiq/front_ends/mcp/register.py +27 -0
- aiq/front_ends/mcp/tool_converter.py +242 -0
- aiq/front_ends/register.py +22 -0
- aiq/front_ends/simple_base/__init__.py +14 -0
- aiq/front_ends/simple_base/simple_front_end_plugin_base.py +52 -0
- aiq/llm/__init__.py +0 -0
- aiq/llm/nim_llm.py +45 -0
- aiq/llm/openai_llm.py +45 -0
- aiq/llm/register.py +22 -0
- aiq/llm/utils/__init__.py +14 -0
- aiq/llm/utils/env_config_value.py +94 -0
- aiq/llm/utils/error.py +17 -0
- aiq/memory/__init__.py +20 -0
- aiq/memory/interfaces.py +183 -0
- aiq/memory/models.py +102 -0
- aiq/meta/module_to_distro.json +3 -0
- aiq/meta/pypi.md +59 -0
- aiq/observability/__init__.py +0 -0
- aiq/observability/async_otel_listener.py +270 -0
- aiq/observability/register.py +97 -0
- aiq/plugins/.namespace +1 -0
- aiq/profiler/__init__.py +0 -0
- aiq/profiler/callbacks/__init__.py +0 -0
- aiq/profiler/callbacks/agno_callback_handler.py +295 -0
- aiq/profiler/callbacks/base_callback_class.py +20 -0
- aiq/profiler/callbacks/langchain_callback_handler.py +278 -0
- aiq/profiler/callbacks/llama_index_callback_handler.py +205 -0
- aiq/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
- aiq/profiler/callbacks/token_usage_base_model.py +27 -0
- aiq/profiler/data_frame_row.py +51 -0
- aiq/profiler/decorators/__init__.py +0 -0
- aiq/profiler/decorators/framework_wrapper.py +131 -0
- aiq/profiler/decorators/function_tracking.py +254 -0
- aiq/profiler/forecasting/__init__.py +0 -0
- aiq/profiler/forecasting/config.py +18 -0
- aiq/profiler/forecasting/model_trainer.py +75 -0
- aiq/profiler/forecasting/models/__init__.py +22 -0
- aiq/profiler/forecasting/models/forecasting_base_model.py +40 -0
- aiq/profiler/forecasting/models/linear_model.py +196 -0
- aiq/profiler/forecasting/models/random_forest_regressor.py +268 -0
- aiq/profiler/inference_metrics_model.py +25 -0
- aiq/profiler/inference_optimization/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +452 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
- aiq/profiler/inference_optimization/data_models.py +386 -0
- aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
- aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
- aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
- aiq/profiler/inference_optimization/llm_metrics.py +212 -0
- aiq/profiler/inference_optimization/prompt_caching.py +163 -0
- aiq/profiler/inference_optimization/token_uniqueness.py +107 -0
- aiq/profiler/inference_optimization/workflow_runtimes.py +72 -0
- aiq/profiler/intermediate_property_adapter.py +102 -0
- aiq/profiler/profile_runner.py +433 -0
- aiq/profiler/utils.py +184 -0
- aiq/registry_handlers/__init__.py +0 -0
- aiq/registry_handlers/local/__init__.py +0 -0
- aiq/registry_handlers/local/local_handler.py +176 -0
- aiq/registry_handlers/local/register_local.py +37 -0
- aiq/registry_handlers/metadata_factory.py +60 -0
- aiq/registry_handlers/package_utils.py +198 -0
- aiq/registry_handlers/pypi/__init__.py +0 -0
- aiq/registry_handlers/pypi/pypi_handler.py +251 -0
- aiq/registry_handlers/pypi/register_pypi.py +40 -0
- aiq/registry_handlers/register.py +21 -0
- aiq/registry_handlers/registry_handler_base.py +157 -0
- aiq/registry_handlers/rest/__init__.py +0 -0
- aiq/registry_handlers/rest/register_rest.py +56 -0
- aiq/registry_handlers/rest/rest_handler.py +237 -0
- aiq/registry_handlers/schemas/__init__.py +0 -0
- aiq/registry_handlers/schemas/headers.py +42 -0
- aiq/registry_handlers/schemas/package.py +68 -0
- aiq/registry_handlers/schemas/publish.py +63 -0
- aiq/registry_handlers/schemas/pull.py +81 -0
- aiq/registry_handlers/schemas/remove.py +36 -0
- aiq/registry_handlers/schemas/search.py +91 -0
- aiq/registry_handlers/schemas/status.py +47 -0
- aiq/retriever/__init__.py +0 -0
- aiq/retriever/interface.py +37 -0
- aiq/retriever/milvus/__init__.py +14 -0
- aiq/retriever/milvus/register.py +81 -0
- aiq/retriever/milvus/retriever.py +228 -0
- aiq/retriever/models.py +74 -0
- aiq/retriever/nemo_retriever/__init__.py +14 -0
- aiq/retriever/nemo_retriever/register.py +60 -0
- aiq/retriever/nemo_retriever/retriever.py +190 -0
- aiq/retriever/register.py +22 -0
- aiq/runtime/__init__.py +14 -0
- aiq/runtime/loader.py +188 -0
- aiq/runtime/runner.py +176 -0
- aiq/runtime/session.py +116 -0
- aiq/settings/__init__.py +0 -0
- aiq/settings/global_settings.py +318 -0
- aiq/test/.namespace +1 -0
- aiq/tool/__init__.py +0 -0
- aiq/tool/code_execution/__init__.py +0 -0
- aiq/tool/code_execution/code_sandbox.py +188 -0
- aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
- aiq/tool/code_execution/local_sandbox/__init__.py +13 -0
- aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +79 -0
- aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +4 -0
- aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +25 -0
- aiq/tool/code_execution/register.py +70 -0
- aiq/tool/code_execution/utils.py +100 -0
- aiq/tool/datetime_tools.py +42 -0
- aiq/tool/document_search.py +141 -0
- aiq/tool/github_tools/__init__.py +0 -0
- aiq/tool/github_tools/create_github_commit.py +133 -0
- aiq/tool/github_tools/create_github_issue.py +87 -0
- aiq/tool/github_tools/create_github_pr.py +106 -0
- aiq/tool/github_tools/get_github_file.py +106 -0
- aiq/tool/github_tools/get_github_issue.py +166 -0
- aiq/tool/github_tools/get_github_pr.py +256 -0
- aiq/tool/github_tools/update_github_issue.py +100 -0
- aiq/tool/mcp/__init__.py +14 -0
- aiq/tool/mcp/mcp_client.py +220 -0
- aiq/tool/mcp/mcp_tool.py +75 -0
- aiq/tool/memory_tools/__init__.py +0 -0
- aiq/tool/memory_tools/add_memory_tool.py +67 -0
- aiq/tool/memory_tools/delete_memory_tool.py +67 -0
- aiq/tool/memory_tools/get_memory_tool.py +72 -0
- aiq/tool/nvidia_rag.py +95 -0
- aiq/tool/register.py +36 -0
- aiq/tool/retriever.py +89 -0
- aiq/utils/__init__.py +0 -0
- aiq/utils/data_models/__init__.py +0 -0
- aiq/utils/data_models/schema_validator.py +58 -0
- aiq/utils/debugging_utils.py +43 -0
- aiq/utils/exception_handlers/__init__.py +0 -0
- aiq/utils/exception_handlers/schemas.py +114 -0
- aiq/utils/io/__init__.py +0 -0
- aiq/utils/io/yaml_tools.py +50 -0
- aiq/utils/metadata_utils.py +74 -0
- aiq/utils/producer_consumer_queue.py +178 -0
- aiq/utils/reactive/__init__.py +0 -0
- aiq/utils/reactive/base/__init__.py +0 -0
- aiq/utils/reactive/base/observable_base.py +65 -0
- aiq/utils/reactive/base/observer_base.py +55 -0
- aiq/utils/reactive/base/subject_base.py +79 -0
- aiq/utils/reactive/observable.py +59 -0
- aiq/utils/reactive/observer.py +76 -0
- aiq/utils/reactive/subject.py +131 -0
- aiq/utils/reactive/subscription.py +49 -0
- aiq/utils/settings/__init__.py +0 -0
- aiq/utils/settings/global_settings.py +197 -0
- aiq/utils/type_converter.py +232 -0
- aiq/utils/type_utils.py +397 -0
- aiq/utils/url_utils.py +27 -0
- aiqtoolkit-1.1.0a20250429.dist-info/METADATA +326 -0
- aiqtoolkit-1.1.0a20250429.dist-info/RECORD +309 -0
- aiqtoolkit-1.1.0a20250429.dist-info/WHEEL +5 -0
- aiqtoolkit-1.1.0a20250429.dist-info/entry_points.txt +17 -0
- aiqtoolkit-1.1.0a20250429.dist-info/licenses/LICENSE-3rd-party.txt +3686 -0
- aiqtoolkit-1.1.0a20250429.dist-info/licenses/LICENSE.md +201 -0
- aiqtoolkit-1.1.0a20250429.dist-info/top_level.txt +1 -0
aiq/memory/interfaces.py
ADDED
|
@@ -0,0 +1,183 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from abc import ABC
|
|
17
|
+
from abc import abstractmethod
|
|
18
|
+
from collections.abc import Callable
|
|
19
|
+
|
|
20
|
+
from .models import MemoryItem
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
class MemoryEditor(ABC):
|
|
24
|
+
"""
|
|
25
|
+
Abstract interface for editing and
|
|
26
|
+
retrieving memory items.
|
|
27
|
+
|
|
28
|
+
A MemoryEditor is responsible for adding, searching, and
|
|
29
|
+
removing MemoryItems.
|
|
30
|
+
|
|
31
|
+
Implementations may integrate with
|
|
32
|
+
vector stores or other indexing backends.
|
|
33
|
+
"""
|
|
34
|
+
|
|
35
|
+
@abstractmethod
|
|
36
|
+
async def add_items(self, items: list[MemoryItem]) -> None:
|
|
37
|
+
"""
|
|
38
|
+
Insert multiple MemoryItems into the memory.
|
|
39
|
+
|
|
40
|
+
Args:
|
|
41
|
+
items (list[MemoryItem]): The items to be added.
|
|
42
|
+
"""
|
|
43
|
+
raise NotImplementedError
|
|
44
|
+
|
|
45
|
+
@abstractmethod
|
|
46
|
+
async def search(self, query: str, top_k: int = 5, **kwargs) -> list[MemoryItem]:
|
|
47
|
+
"""
|
|
48
|
+
Retrieve items relevant to the given query.
|
|
49
|
+
Relevance criteria depend on implementation.
|
|
50
|
+
|
|
51
|
+
Args:
|
|
52
|
+
query (str): The query string to match.
|
|
53
|
+
top_k (int): Maximum number of items to return.
|
|
54
|
+
kwargs (dict): Keyword arguments to pass to the search method.
|
|
55
|
+
|
|
56
|
+
Returns:
|
|
57
|
+
list[MemoryItem]: The most relevant MemoryItems.
|
|
58
|
+
"""
|
|
59
|
+
raise NotImplementedError
|
|
60
|
+
|
|
61
|
+
@abstractmethod
|
|
62
|
+
async def remove_items(self, **kwargs) -> None:
|
|
63
|
+
"""
|
|
64
|
+
Remove items. Additional parameters
|
|
65
|
+
needed for deletion can be specified in keyword arguments.
|
|
66
|
+
|
|
67
|
+
Args:
|
|
68
|
+
kwargs (dict): Keyword arguments to pass to the remove-items method.
|
|
69
|
+
"""
|
|
70
|
+
raise NotImplementedError
|
|
71
|
+
|
|
72
|
+
|
|
73
|
+
class MemoryIOBase(ABC):
|
|
74
|
+
"""
|
|
75
|
+
Base abstract class for I/O operations
|
|
76
|
+
on memory, providing a common interface for
|
|
77
|
+
|
|
78
|
+
MemoryReader and MemoryWriter to interact
|
|
79
|
+
with a MemoryEditor.
|
|
80
|
+
|
|
81
|
+
Concrete subclasses should hold a
|
|
82
|
+
reference to a MemoryEditor instance.
|
|
83
|
+
"""
|
|
84
|
+
|
|
85
|
+
def __init__(self, editor: MemoryEditor) -> None:
|
|
86
|
+
self._editor = editor
|
|
87
|
+
|
|
88
|
+
|
|
89
|
+
class MemoryReader(MemoryIOBase):
|
|
90
|
+
"""
|
|
91
|
+
Responsible for retrieving MemoryItems
|
|
92
|
+
from the MemoryEditor based on context or queries.
|
|
93
|
+
"""
|
|
94
|
+
|
|
95
|
+
@abstractmethod
|
|
96
|
+
async def retrieve(self, context: str, top_k: int = 5) -> list[MemoryItem]:
|
|
97
|
+
"""
|
|
98
|
+
Retrieve a subset of
|
|
99
|
+
MemoryItems relevant to the provided context.
|
|
100
|
+
|
|
101
|
+
Args:
|
|
102
|
+
context (str): A string representing
|
|
103
|
+
the current user context or query.
|
|
104
|
+
top_k (int): Maximum number of items to return.
|
|
105
|
+
|
|
106
|
+
Returns:
|
|
107
|
+
list[MemoryItem]: Relevant MemoryItems.
|
|
108
|
+
"""
|
|
109
|
+
raise NotImplementedError
|
|
110
|
+
|
|
111
|
+
|
|
112
|
+
class MemoryWriter(MemoryIOBase):
|
|
113
|
+
"""
|
|
114
|
+
Responsible for converting new observations
|
|
115
|
+
(textual inputs) into MemoryItems andstoring
|
|
116
|
+
them via the MemoryEditor.
|
|
117
|
+
"""
|
|
118
|
+
|
|
119
|
+
@abstractmethod
|
|
120
|
+
async def write(self, observation: str, context: str | None = None) -> list[MemoryItem]:
|
|
121
|
+
"""
|
|
122
|
+
Process the given observation and store the resulting MemoryItems.
|
|
123
|
+
|
|
124
|
+
Args:
|
|
125
|
+
observation (str): The new textual input to record.
|
|
126
|
+
context (Optional[str]): Additional
|
|
127
|
+
context that might influence how the observation is stored.
|
|
128
|
+
|
|
129
|
+
Returns:
|
|
130
|
+
list[MemoryItem]: The newly created MemoryItems.
|
|
131
|
+
"""
|
|
132
|
+
raise NotImplementedError
|
|
133
|
+
|
|
134
|
+
|
|
135
|
+
class MemoryManager(ABC):
|
|
136
|
+
"""
|
|
137
|
+
Manages the lifecycle of the stored
|
|
138
|
+
memory by applying policies such as summarization,
|
|
139
|
+
reflection, forgetting, and mergingn
|
|
140
|
+
to ensure long-term coherence and relevance.
|
|
141
|
+
"""
|
|
142
|
+
|
|
143
|
+
@abstractmethod
|
|
144
|
+
async def summarize(self) -> None:
|
|
145
|
+
"""
|
|
146
|
+
Summarize long or numerous MemoryItems into a more compact form.
|
|
147
|
+
This may remove the original items and store a new summary item.
|
|
148
|
+
"""
|
|
149
|
+
raise NotImplementedError
|
|
150
|
+
|
|
151
|
+
@abstractmethod
|
|
152
|
+
async def reflect(self) -> None:
|
|
153
|
+
"""
|
|
154
|
+
Generate higher-level insights or
|
|
155
|
+
abstractions from existing MemoryItems.
|
|
156
|
+
This may call out to an LLM or other
|
|
157
|
+
logic to produce conceptual memory.
|
|
158
|
+
"""
|
|
159
|
+
raise NotImplementedError
|
|
160
|
+
|
|
161
|
+
@abstractmethod
|
|
162
|
+
async def forget(self, criteria: Callable[[MemoryItem], bool]) -> None:
|
|
163
|
+
"""
|
|
164
|
+
Remove MemoryItems that are no
|
|
165
|
+
longer relevant or have low importance.
|
|
166
|
+
|
|
167
|
+
Args:
|
|
168
|
+
criteria (Callable[[MemoryItem], bool]): A function that
|
|
169
|
+
returns True for items to forget.
|
|
170
|
+
"""
|
|
171
|
+
raise NotImplementedError
|
|
172
|
+
|
|
173
|
+
@abstractmethod
|
|
174
|
+
async def merge(self, criteria: Callable[[MemoryItem, MemoryItem], bool]) -> None:
|
|
175
|
+
"""
|
|
176
|
+
Merge similar or redundant MemoryItems
|
|
177
|
+
into a smaller set of more concise items.
|
|
178
|
+
|
|
179
|
+
Args:
|
|
180
|
+
criteria (Callable[[MemoryItem, MemoryItem], bool]): A function
|
|
181
|
+
that determines which items can be merged.
|
|
182
|
+
"""
|
|
183
|
+
raise NotImplementedError
|
aiq/memory/models.py
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import typing
|
|
17
|
+
|
|
18
|
+
from pydantic import BaseModel
|
|
19
|
+
from pydantic import ConfigDict
|
|
20
|
+
from pydantic import Field
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
class MemoryItem(BaseModel):
|
|
24
|
+
"""
|
|
25
|
+
Represents a single memory item consisting of structured content and associated metadata.
|
|
26
|
+
|
|
27
|
+
Attributes
|
|
28
|
+
----------
|
|
29
|
+
conversation : list[dict[str, str]]
|
|
30
|
+
A list of dictionaries, each containing string key-value pairs.
|
|
31
|
+
user_id : str
|
|
32
|
+
Unique identifier for this MemoryItem's user.
|
|
33
|
+
tags : list[str]
|
|
34
|
+
A list of strings representing tags attached to the item.
|
|
35
|
+
metadata : dict[str, typing.Any]
|
|
36
|
+
Metadata providing context and utility for management operations.
|
|
37
|
+
memory : str or None
|
|
38
|
+
Optional memory string. Helpful when returning a memory.
|
|
39
|
+
"""
|
|
40
|
+
model_config = ConfigDict(
|
|
41
|
+
# Add an example for the schema
|
|
42
|
+
json_schema_extra={
|
|
43
|
+
"examples": [{
|
|
44
|
+
"conversation": [
|
|
45
|
+
{
|
|
46
|
+
"role": "user",
|
|
47
|
+
"content": "Hi, I'm Alex. I'm a vegetarian and I'm allergic to nuts.",
|
|
48
|
+
},
|
|
49
|
+
{
|
|
50
|
+
"role": "assistant",
|
|
51
|
+
"content": "Hello Alex! I've noted that you're a vegetarian and have a nut allergy.",
|
|
52
|
+
},
|
|
53
|
+
],
|
|
54
|
+
"user_id": "user_abc",
|
|
55
|
+
"metadata": {
|
|
56
|
+
"key_value_pairs": {
|
|
57
|
+
"type": "technology", "relevance": "high"
|
|
58
|
+
}
|
|
59
|
+
}
|
|
60
|
+
}]
|
|
61
|
+
},
|
|
62
|
+
# Allow population of models from arbitrary types (e.g., ORM objects)
|
|
63
|
+
arbitrary_types_allowed=True,
|
|
64
|
+
# Enable aliasing if needed
|
|
65
|
+
populate_by_name=True)
|
|
66
|
+
|
|
67
|
+
conversation: list[dict[str, str]] = Field(description="List of conversation messages. "
|
|
68
|
+
"Each message must have a \"role\" "
|
|
69
|
+
"key (user or assistant. It must "
|
|
70
|
+
"als have a \"content\" key.")
|
|
71
|
+
tags: list[str] = Field(default_factory=list, description="List of tags applied to the item.")
|
|
72
|
+
metadata: dict[str, typing.Any] = Field(description="Metadata about the memory item.")
|
|
73
|
+
user_id: str = Field(description="The user's ID.")
|
|
74
|
+
memory: str | None = Field(default=None)
|
|
75
|
+
|
|
76
|
+
|
|
77
|
+
class SearchMemoryInput(BaseModel):
|
|
78
|
+
"""
|
|
79
|
+
Represents a search memory input structure.
|
|
80
|
+
"""
|
|
81
|
+
model_config = ConfigDict(json_schema_extra={
|
|
82
|
+
"example": {
|
|
83
|
+
"query": "What is the user's preferred programming language?",
|
|
84
|
+
"top_k": 1,
|
|
85
|
+
"user_id": "user_abc",
|
|
86
|
+
}
|
|
87
|
+
})
|
|
88
|
+
|
|
89
|
+
query: str = Field(description="Search query for which to retrieve memory.") # noqa: E501
|
|
90
|
+
top_k: int = Field(description="Maximum number of memories to return")
|
|
91
|
+
user_id: str = Field(description="ID of the user to search for.")
|
|
92
|
+
|
|
93
|
+
|
|
94
|
+
class DeleteMemoryInput(BaseModel):
|
|
95
|
+
"""
|
|
96
|
+
Represents a delete memory input structure.
|
|
97
|
+
"""
|
|
98
|
+
model_config = ConfigDict(json_schema_extra={"example": {"user_id": "user_abc", }})
|
|
99
|
+
|
|
100
|
+
user_id: str = Field(description="ID of the user to delete memory for. Careful when using "
|
|
101
|
+
"this tool; make sure you use the "
|
|
102
|
+
"username present in the conversation.")
|
aiq/meta/pypi.md
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
1
|
+
<!--
|
|
2
|
+
SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
3
|
+
SPDX-License-Identifier: Apache-2.0
|
|
4
|
+
|
|
5
|
+
Licensed under the Apache License, Version 2.0 (the "License");
|
|
6
|
+
you may not use this file except in compliance with the License.
|
|
7
|
+
You may obtain a copy of the License at
|
|
8
|
+
|
|
9
|
+
http:/www.apache.org/licenses/LICENSE-2.0
|
|
10
|
+
|
|
11
|
+
Unless required by applicable law or agreed to in writing, software
|
|
12
|
+
distributed under the License is distributed on an "AS IS" BASIS,
|
|
13
|
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
14
|
+
See the License for the specific language governing permissions and
|
|
15
|
+
limitations under the License.
|
|
16
|
+
-->
|
|
17
|
+
|
|
18
|
+

|
|
19
|
+
|
|
20
|
+
# NVIDIA AgentIQ
|
|
21
|
+
|
|
22
|
+
AgentIQ is a flexible library designed to seamlessly integrate your enterprise agents—regardless of framework—with various data sources and tools. By treating agents, tools, and agentic workflows as simple function calls, AgentIQ enables true composability: build once and reuse anywhere.
|
|
23
|
+
|
|
24
|
+
## Key Features
|
|
25
|
+
|
|
26
|
+
- [**Framework Agnostic:**](https://docs.nvidia.com/agentiq/latest/concepts/plugins.html) Works with any agentic framework, so you can use your current technology stack without replatforming.
|
|
27
|
+
- [**Reusability:**](https://docs.nvidia.com/agentiq/latest/guides/sharing-workflows-and-tools.html) Every agent, tool, or workflow can be combined and repurposed, allowing developers to leverage existing work in new scenarios.
|
|
28
|
+
- [**Rapid Development:**](https://docs.nvidia.com/agentiq/latest/guides/create-customize-workflows.html) Start with a pre-built agent, tool, or workflow, and customize it to your needs.
|
|
29
|
+
- [**Profiling:**](https://docs.nvidia.com/agentiq/latest/guides/profiler.html) Profile entire workflows down to the tool and agent level, track input/output tokens and timings, and identify bottlenecks.
|
|
30
|
+
- [**Observability:**](https://docs.nvidia.com/agentiq/latest/guides/observe-workflow-with-phoenix.html) Monitor and debug your workflows with any OpenTelemetry-compatible observability tool.
|
|
31
|
+
- [**Evaluation System:**](https://docs.nvidia.com/agentiq/latest/guides/evaluate.html) Validate and maintain accuracy of agentic workflows with built-in evaluation tools.
|
|
32
|
+
- [**User Interface:**](https://docs.nvidia.com/agentiq/latest/guides/using-agentiq-ui-and-server.html) Use the AgentIQ UI chat interface to interact with your agents, visualize output, and debug workflows.
|
|
33
|
+
- [**MCP Compatibility**](https://docs.nvidia.com/agentiq/latest/components/mcp.html) Compatible with Model Context Protocol (MCP), allowing tools served by MCP Servers to be used as AgentIQ functions.
|
|
34
|
+
|
|
35
|
+
With AgentIQ, you can move quickly, experiment freely, and ensure reliability across all your agent-driven projects.
|
|
36
|
+
|
|
37
|
+
## Links
|
|
38
|
+
* [Documentation](https://docs.nvidia.com/agentiq/latest/index.html): Explore the full documentation for AgentIQ.
|
|
39
|
+
* [About AgentIQ](https://docs.nvidia.com/agentiq/latest/intro/why-agentiq.html): Learn more about the benefits of using AgentIQ.
|
|
40
|
+
|
|
41
|
+
## First time user?
|
|
42
|
+
If this is your first time using AgentIQ, it is recommended to install the latest version from the [source repository](https://github.com/NVIDIA/AgentIQ?tab=readme-ov-file#get-started) on GitHub. This package is intended for users who are familiar with AgentIQ applications and need to add AgentIQ as a dependency to their project.
|
|
43
|
+
|
|
44
|
+
## Feedback
|
|
45
|
+
|
|
46
|
+
We would love to hear from you! Please file an issue on [GitHub](https://github.com/NVIDIA/AgentIQ/issues) if you have any feedback or feature requests.
|
|
47
|
+
|
|
48
|
+
## Acknowledgements
|
|
49
|
+
|
|
50
|
+
We would like to thank the following open source projects that made AgentIQ possible:
|
|
51
|
+
|
|
52
|
+
- [CrewAI](https://github.com/crewAIInc/crewAI)
|
|
53
|
+
- [FastAPI](https://github.com/tiangolo/fastapi)
|
|
54
|
+
- [LangChain](https://github.com/langchain-ai/langchain)
|
|
55
|
+
- [Llama-Index](https://github.com/run-llama/llama_index)
|
|
56
|
+
- [Mem0ai](https://github.com/mem0ai/mem0)
|
|
57
|
+
- [Ragas](https://github.com/explodinggradients/ragas)
|
|
58
|
+
- [Semantic Kernel](https://github.com/microsoft/semantic-kernel)
|
|
59
|
+
- [uv](https://github.com/astral-sh/uv)
|
|
File without changes
|
|
@@ -0,0 +1,270 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
import re
|
|
18
|
+
from contextlib import asynccontextmanager
|
|
19
|
+
from typing import Any
|
|
20
|
+
|
|
21
|
+
from openinference.semconv.trace import OpenInferenceSpanKindValues
|
|
22
|
+
from openinference.semconv.trace import SpanAttributes
|
|
23
|
+
from opentelemetry import trace
|
|
24
|
+
from opentelemetry.sdk.trace import TracerProvider
|
|
25
|
+
from opentelemetry.trace import Span
|
|
26
|
+
from opentelemetry.trace.propagation import set_span_in_context
|
|
27
|
+
from pydantic import TypeAdapter
|
|
28
|
+
|
|
29
|
+
from aiq.builder.context import AIQContextState
|
|
30
|
+
from aiq.data_models.intermediate_step import IntermediateStep
|
|
31
|
+
from aiq.data_models.intermediate_step import IntermediateStepState
|
|
32
|
+
|
|
33
|
+
logger = logging.getLogger(__name__)
|
|
34
|
+
|
|
35
|
+
OPENINFERENCE_SPAN_KIND = SpanAttributes.OPENINFERENCE_SPAN_KIND
|
|
36
|
+
|
|
37
|
+
|
|
38
|
+
def _ns_timestamp(seconds_float: float) -> int:
|
|
39
|
+
"""
|
|
40
|
+
Convert AgentIQ’s float `event_timestamp` (in seconds) into an integer number
|
|
41
|
+
of nanoseconds, as OpenTelemetry expects.
|
|
42
|
+
"""
|
|
43
|
+
return int(seconds_float * 1e9)
|
|
44
|
+
|
|
45
|
+
|
|
46
|
+
class AsyncOtelSpanListener:
|
|
47
|
+
"""
|
|
48
|
+
A separate, async class that listens to the AgentIQ intermediate step
|
|
49
|
+
event stream and creates proper Otel spans:
|
|
50
|
+
|
|
51
|
+
- On FUNCTION_START => open a new top-level span
|
|
52
|
+
- On any other intermediate step => open a child subspan (immediate open/close)
|
|
53
|
+
- On FUNCTION_END => close the function’s top-level span
|
|
54
|
+
|
|
55
|
+
This runs fully independently from the normal AgentIQ workflow, so that
|
|
56
|
+
the workflow is not blocking or entangled by OTel calls.
|
|
57
|
+
"""
|
|
58
|
+
|
|
59
|
+
def __init__(self, context_state: AIQContextState | None = None):
|
|
60
|
+
"""
|
|
61
|
+
:param context_state: Optionally supply a specific AIQContextState.
|
|
62
|
+
If None, uses the global singleton.
|
|
63
|
+
"""
|
|
64
|
+
self._context_state = context_state or AIQContextState.get()
|
|
65
|
+
|
|
66
|
+
# Maintain a subscription so we can unsubscribe on shutdown
|
|
67
|
+
self._subscription = None
|
|
68
|
+
|
|
69
|
+
# Outstanding spans which have been opened but not yet closed
|
|
70
|
+
self._outstanding_spans: dict[str, Span] = {}
|
|
71
|
+
|
|
72
|
+
# Stack of spans, for when we need to create a child span
|
|
73
|
+
self._span_stack: list[Span] = []
|
|
74
|
+
|
|
75
|
+
self._running = False
|
|
76
|
+
|
|
77
|
+
# Prepare the tracer (optionally you might already have done this)
|
|
78
|
+
if trace.get_tracer_provider() is None or not isinstance(trace.get_tracer_provider(), TracerProvider):
|
|
79
|
+
tracer_provider = TracerProvider()
|
|
80
|
+
trace.set_tracer_provider(tracer_provider)
|
|
81
|
+
|
|
82
|
+
# We’ll optionally attach exporters if you want (out of scope to do it here).
|
|
83
|
+
# Example: tracer_provider.add_span_processor(BatchSpanProcessor(your_exporter))
|
|
84
|
+
|
|
85
|
+
self._tracer = trace.get_tracer("aiq-async-otel-listener")
|
|
86
|
+
|
|
87
|
+
def _on_next(self, step: IntermediateStep) -> None:
|
|
88
|
+
"""
|
|
89
|
+
The main logic that reacts to each IntermediateStep.
|
|
90
|
+
"""
|
|
91
|
+
if (step.event_state == IntermediateStepState.START):
|
|
92
|
+
|
|
93
|
+
self._process_start_event(step)
|
|
94
|
+
|
|
95
|
+
elif (step.event_state == IntermediateStepState.END):
|
|
96
|
+
|
|
97
|
+
self._process_end_event(step)
|
|
98
|
+
|
|
99
|
+
def _on_error(self, exc: Exception) -> None:
|
|
100
|
+
logger.error("Error in intermediate step subscription: %s", exc, exc_info=True)
|
|
101
|
+
|
|
102
|
+
def _on_complete(self) -> None:
|
|
103
|
+
logger.debug("Intermediate step stream completed. No more events will arrive.")
|
|
104
|
+
|
|
105
|
+
@asynccontextmanager
|
|
106
|
+
async def start(self):
|
|
107
|
+
"""
|
|
108
|
+
Usage::
|
|
109
|
+
|
|
110
|
+
otel_listener = AsyncOtelSpanListener()
|
|
111
|
+
async with otel_listener.start():
|
|
112
|
+
# run your AgentIQ workflow
|
|
113
|
+
...
|
|
114
|
+
# cleans up
|
|
115
|
+
|
|
116
|
+
This sets up the subscription to the AgentIQ event stream and starts the background loop.
|
|
117
|
+
"""
|
|
118
|
+
try:
|
|
119
|
+
# Subscribe to the event stream
|
|
120
|
+
subject = self._context_state.event_stream.get()
|
|
121
|
+
self._subscription = subject.subscribe(
|
|
122
|
+
on_next=self._on_next,
|
|
123
|
+
on_error=self._on_error,
|
|
124
|
+
on_complete=self._on_complete,
|
|
125
|
+
)
|
|
126
|
+
|
|
127
|
+
self._running = True
|
|
128
|
+
|
|
129
|
+
yield # let the caller do their workflow
|
|
130
|
+
|
|
131
|
+
finally:
|
|
132
|
+
# Cleanup
|
|
133
|
+
self._running = False
|
|
134
|
+
# Close out any running spans
|
|
135
|
+
await self._cleanup()
|
|
136
|
+
|
|
137
|
+
if self._subscription:
|
|
138
|
+
self._subscription.unsubscribe()
|
|
139
|
+
self._subscription = None
|
|
140
|
+
|
|
141
|
+
async def _cleanup(self):
|
|
142
|
+
"""
|
|
143
|
+
Close any remaining open spans.
|
|
144
|
+
"""
|
|
145
|
+
if self._outstanding_spans:
|
|
146
|
+
logger.warning(
|
|
147
|
+
"Not all spans were closed. Ensure all start events have a corresponding end event. Remaining: %s",
|
|
148
|
+
self._outstanding_spans)
|
|
149
|
+
|
|
150
|
+
for span_info in self._outstanding_spans.values():
|
|
151
|
+
span_info.end()
|
|
152
|
+
|
|
153
|
+
self._outstanding_spans.clear()
|
|
154
|
+
|
|
155
|
+
if self._span_stack:
|
|
156
|
+
logger.error(
|
|
157
|
+
"Not all spans were closed. Ensure all start events have a corresponding end event. Remaining: %s",
|
|
158
|
+
self._span_stack)
|
|
159
|
+
|
|
160
|
+
self._span_stack.clear()
|
|
161
|
+
|
|
162
|
+
def _serialize_payload(self, input_value: Any) -> tuple[str, bool]:
|
|
163
|
+
"""
|
|
164
|
+
Serialize the input value to a string. Returns a tuple with the serialized value and a boolean indicating if the
|
|
165
|
+
serialization is JSON or a string
|
|
166
|
+
"""
|
|
167
|
+
try:
|
|
168
|
+
return TypeAdapter(type(input_value)).dump_json(input_value).decode('utf-8'), True
|
|
169
|
+
except Exception:
|
|
170
|
+
# Fallback to string representation if we can't serialize using pydantic
|
|
171
|
+
return str(input_value), False
|
|
172
|
+
|
|
173
|
+
def _process_start_event(self, step: IntermediateStep):
|
|
174
|
+
|
|
175
|
+
parent_ctx = None
|
|
176
|
+
|
|
177
|
+
if (len(self._span_stack) > 0):
|
|
178
|
+
parent_span = self._span_stack[-1]
|
|
179
|
+
|
|
180
|
+
parent_ctx = set_span_in_context(parent_span)
|
|
181
|
+
|
|
182
|
+
# Extract start/end times from the step
|
|
183
|
+
# By convention, `span_event_timestamp` is the time we started, `event_timestamp` is the time we ended.
|
|
184
|
+
# If span_event_timestamp is missing, we default to event_timestamp (meaning zero-length).
|
|
185
|
+
s_ts = step.payload.span_event_timestamp or step.payload.event_timestamp
|
|
186
|
+
start_ns = _ns_timestamp(s_ts)
|
|
187
|
+
|
|
188
|
+
# Optional: embed the LLM/tool name if present
|
|
189
|
+
if step.payload.name:
|
|
190
|
+
sub_span_name = f"{step.payload.name}"
|
|
191
|
+
else:
|
|
192
|
+
sub_span_name = f"{step.payload.event_type}"
|
|
193
|
+
|
|
194
|
+
# Start the subspan
|
|
195
|
+
sub_span = self._tracer.start_span(
|
|
196
|
+
name=sub_span_name,
|
|
197
|
+
context=parent_ctx,
|
|
198
|
+
attributes={
|
|
199
|
+
"aiq.event_type": step.payload.event_type.value,
|
|
200
|
+
"aiq.function.id": step.function_ancestry.function_id,
|
|
201
|
+
"aiq.function.name": step.function_ancestry.function_name,
|
|
202
|
+
"aiq.subspan.name": step.payload.name or "",
|
|
203
|
+
"aiq.event_timestamp": step.event_timestamp,
|
|
204
|
+
"aiq.framework": step.payload.framework.value if step.payload.framework else "unknown",
|
|
205
|
+
},
|
|
206
|
+
start_time=start_ns,
|
|
207
|
+
)
|
|
208
|
+
|
|
209
|
+
event_type_to_span_kind = {
|
|
210
|
+
"LLM_START": OpenInferenceSpanKindValues.LLM,
|
|
211
|
+
"LLM_END": OpenInferenceSpanKindValues.LLM,
|
|
212
|
+
"LLM_NEW_TOKEN": OpenInferenceSpanKindValues.LLM,
|
|
213
|
+
"TOOL_START": OpenInferenceSpanKindValues.TOOL,
|
|
214
|
+
"TOOL_END": OpenInferenceSpanKindValues.TOOL,
|
|
215
|
+
"FUNCTION_START": OpenInferenceSpanKindValues.CHAIN,
|
|
216
|
+
"FUNCTION_END": OpenInferenceSpanKindValues.CHAIN,
|
|
217
|
+
}
|
|
218
|
+
|
|
219
|
+
span_kind = event_type_to_span_kind.get(step.event_type, OpenInferenceSpanKindValues.UNKNOWN)
|
|
220
|
+
sub_span.set_attribute(SpanAttributes.OPENINFERENCE_SPAN_KIND, span_kind.value)
|
|
221
|
+
|
|
222
|
+
if step.payload.data and step.payload.data.input:
|
|
223
|
+
# optional parse
|
|
224
|
+
match = re.search(r"Human:\s*Question:\s*(.*)", str(step.payload.data.input))
|
|
225
|
+
if match:
|
|
226
|
+
human_question = match.group(1).strip()
|
|
227
|
+
sub_span.set_attribute(SpanAttributes.INPUT_VALUE, human_question)
|
|
228
|
+
else:
|
|
229
|
+
serialized_input, is_json = self._serialize_payload(step.payload.data.input)
|
|
230
|
+
sub_span.set_attribute(SpanAttributes.INPUT_VALUE, serialized_input)
|
|
231
|
+
sub_span.set_attribute(SpanAttributes.INPUT_MIME_TYPE, "application/json" if is_json else "text/plain")
|
|
232
|
+
|
|
233
|
+
self._span_stack.append(sub_span)
|
|
234
|
+
|
|
235
|
+
self._outstanding_spans[step.UUID] = sub_span
|
|
236
|
+
|
|
237
|
+
def _process_end_event(self, step: IntermediateStep):
|
|
238
|
+
|
|
239
|
+
# Find the subspan that was created in the start event
|
|
240
|
+
sub_span = self._outstanding_spans.pop(step.UUID, None)
|
|
241
|
+
|
|
242
|
+
if sub_span is None:
|
|
243
|
+
logger.warning("No subspan found for step %s", step.UUID)
|
|
244
|
+
return
|
|
245
|
+
|
|
246
|
+
self._span_stack.pop()
|
|
247
|
+
|
|
248
|
+
# Optionally add more attributes from usage_info or data
|
|
249
|
+
usage_info = step.payload.usage_info
|
|
250
|
+
if usage_info:
|
|
251
|
+
sub_span.set_attribute("aiq.usage.num_llm_calls",
|
|
252
|
+
usage_info.num_llm_calls if usage_info.num_llm_calls else 0)
|
|
253
|
+
sub_span.set_attribute("aiq.usage.seconds_between_calls",
|
|
254
|
+
usage_info.seconds_between_calls if usage_info.seconds_between_calls else 0)
|
|
255
|
+
sub_span.set_attribute(SpanAttributes.LLM_TOKEN_COUNT_PROMPT,
|
|
256
|
+
usage_info.token_usage.prompt_tokens if usage_info.token_usage else 0)
|
|
257
|
+
sub_span.set_attribute(SpanAttributes.LLM_TOKEN_COUNT_COMPLETION,
|
|
258
|
+
usage_info.token_usage.completion_tokens if usage_info.token_usage else 0)
|
|
259
|
+
sub_span.set_attribute(SpanAttributes.LLM_TOKEN_COUNT_TOTAL,
|
|
260
|
+
usage_info.token_usage.total_tokens if usage_info.token_usage else 0)
|
|
261
|
+
|
|
262
|
+
if step.payload.data and step.payload.data.output is not None:
|
|
263
|
+
serialized_output, is_json = self._serialize_payload(step.payload.data.output)
|
|
264
|
+
sub_span.set_attribute(SpanAttributes.OUTPUT_VALUE, serialized_output)
|
|
265
|
+
sub_span.set_attribute(SpanAttributes.OUTPUT_MIME_TYPE, "application/json" if is_json else "text/plain")
|
|
266
|
+
|
|
267
|
+
end_ns = _ns_timestamp(step.payload.event_timestamp)
|
|
268
|
+
|
|
269
|
+
# End the subspan
|
|
270
|
+
sub_span.end(end_time=end_ns)
|