aiqtoolkit 1.1.0a20250515__py3-none-any.whl → 1.1.0a20251020__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of aiqtoolkit might be problematic. Click here for more details.
- aiqtoolkit-1.1.0a20251020.dist-info/METADATA +37 -0
- aiqtoolkit-1.1.0a20251020.dist-info/RECORD +4 -0
- {aiqtoolkit-1.1.0a20250515.dist-info → aiqtoolkit-1.1.0a20251020.dist-info}/WHEEL +1 -1
- aiqtoolkit-1.1.0a20251020.dist-info/top_level.txt +1 -0
- aiq/agent/__init__.py +0 -0
- aiq/agent/base.py +0 -76
- aiq/agent/dual_node.py +0 -67
- aiq/agent/react_agent/__init__.py +0 -0
- aiq/agent/react_agent/agent.py +0 -322
- aiq/agent/react_agent/output_parser.py +0 -104
- aiq/agent/react_agent/prompt.py +0 -46
- aiq/agent/react_agent/register.py +0 -148
- aiq/agent/reasoning_agent/__init__.py +0 -0
- aiq/agent/reasoning_agent/reasoning_agent.py +0 -224
- aiq/agent/register.py +0 -23
- aiq/agent/rewoo_agent/__init__.py +0 -0
- aiq/agent/rewoo_agent/agent.py +0 -410
- aiq/agent/rewoo_agent/prompt.py +0 -108
- aiq/agent/rewoo_agent/register.py +0 -158
- aiq/agent/tool_calling_agent/__init__.py +0 -0
- aiq/agent/tool_calling_agent/agent.py +0 -123
- aiq/agent/tool_calling_agent/register.py +0 -105
- aiq/builder/__init__.py +0 -0
- aiq/builder/builder.py +0 -223
- aiq/builder/component_utils.py +0 -303
- aiq/builder/context.py +0 -227
- aiq/builder/embedder.py +0 -24
- aiq/builder/eval_builder.py +0 -120
- aiq/builder/evaluator.py +0 -29
- aiq/builder/framework_enum.py +0 -24
- aiq/builder/front_end.py +0 -73
- aiq/builder/function.py +0 -297
- aiq/builder/function_base.py +0 -376
- aiq/builder/function_info.py +0 -627
- aiq/builder/intermediate_step_manager.py +0 -135
- aiq/builder/llm.py +0 -25
- aiq/builder/retriever.py +0 -25
- aiq/builder/user_interaction_manager.py +0 -71
- aiq/builder/workflow.py +0 -143
- aiq/builder/workflow_builder.py +0 -757
- aiq/cli/__init__.py +0 -14
- aiq/cli/cli_utils/__init__.py +0 -0
- aiq/cli/cli_utils/config_override.py +0 -231
- aiq/cli/cli_utils/validation.py +0 -37
- aiq/cli/commands/__init__.py +0 -0
- aiq/cli/commands/configure/__init__.py +0 -0
- aiq/cli/commands/configure/channel/__init__.py +0 -0
- aiq/cli/commands/configure/channel/add.py +0 -28
- aiq/cli/commands/configure/channel/channel.py +0 -36
- aiq/cli/commands/configure/channel/remove.py +0 -30
- aiq/cli/commands/configure/channel/update.py +0 -30
- aiq/cli/commands/configure/configure.py +0 -33
- aiq/cli/commands/evaluate.py +0 -139
- aiq/cli/commands/info/__init__.py +0 -14
- aiq/cli/commands/info/info.py +0 -39
- aiq/cli/commands/info/list_channels.py +0 -32
- aiq/cli/commands/info/list_components.py +0 -129
- aiq/cli/commands/info/list_mcp.py +0 -126
- aiq/cli/commands/registry/__init__.py +0 -14
- aiq/cli/commands/registry/publish.py +0 -88
- aiq/cli/commands/registry/pull.py +0 -118
- aiq/cli/commands/registry/registry.py +0 -38
- aiq/cli/commands/registry/remove.py +0 -108
- aiq/cli/commands/registry/search.py +0 -155
- aiq/cli/commands/start.py +0 -250
- aiq/cli/commands/uninstall.py +0 -83
- aiq/cli/commands/validate.py +0 -47
- aiq/cli/commands/workflow/__init__.py +0 -14
- aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
- aiq/cli/commands/workflow/templates/config.yml.j2 +0 -16
- aiq/cli/commands/workflow/templates/pyproject.toml.j2 +0 -22
- aiq/cli/commands/workflow/templates/register.py.j2 +0 -5
- aiq/cli/commands/workflow/templates/workflow.py.j2 +0 -36
- aiq/cli/commands/workflow/workflow.py +0 -37
- aiq/cli/commands/workflow/workflow_commands.py +0 -313
- aiq/cli/entrypoint.py +0 -133
- aiq/cli/main.py +0 -44
- aiq/cli/register_workflow.py +0 -408
- aiq/cli/type_registry.py +0 -879
- aiq/data_models/__init__.py +0 -14
- aiq/data_models/api_server.py +0 -588
- aiq/data_models/common.py +0 -143
- aiq/data_models/component.py +0 -46
- aiq/data_models/component_ref.py +0 -135
- aiq/data_models/config.py +0 -349
- aiq/data_models/dataset_handler.py +0 -122
- aiq/data_models/discovery_metadata.py +0 -286
- aiq/data_models/embedder.py +0 -26
- aiq/data_models/evaluate.py +0 -104
- aiq/data_models/evaluator.py +0 -26
- aiq/data_models/front_end.py +0 -26
- aiq/data_models/function.py +0 -30
- aiq/data_models/function_dependencies.py +0 -64
- aiq/data_models/interactive.py +0 -237
- aiq/data_models/intermediate_step.py +0 -269
- aiq/data_models/invocation_node.py +0 -38
- aiq/data_models/llm.py +0 -26
- aiq/data_models/logging.py +0 -26
- aiq/data_models/memory.py +0 -26
- aiq/data_models/profiler.py +0 -53
- aiq/data_models/registry_handler.py +0 -26
- aiq/data_models/retriever.py +0 -30
- aiq/data_models/step_adaptor.py +0 -64
- aiq/data_models/streaming.py +0 -33
- aiq/data_models/swe_bench_model.py +0 -54
- aiq/data_models/telemetry_exporter.py +0 -26
- aiq/embedder/__init__.py +0 -0
- aiq/embedder/langchain_client.py +0 -41
- aiq/embedder/nim_embedder.py +0 -58
- aiq/embedder/openai_embedder.py +0 -42
- aiq/embedder/register.py +0 -24
- aiq/eval/__init__.py +0 -14
- aiq/eval/config.py +0 -42
- aiq/eval/dataset_handler/__init__.py +0 -0
- aiq/eval/dataset_handler/dataset_downloader.py +0 -106
- aiq/eval/dataset_handler/dataset_filter.py +0 -52
- aiq/eval/dataset_handler/dataset_handler.py +0 -169
- aiq/eval/evaluate.py +0 -325
- aiq/eval/evaluator/__init__.py +0 -14
- aiq/eval/evaluator/evaluator_model.py +0 -44
- aiq/eval/intermediate_step_adapter.py +0 -93
- aiq/eval/rag_evaluator/__init__.py +0 -0
- aiq/eval/rag_evaluator/evaluate.py +0 -138
- aiq/eval/rag_evaluator/register.py +0 -138
- aiq/eval/register.py +0 -23
- aiq/eval/remote_workflow.py +0 -128
- aiq/eval/runtime_event_subscriber.py +0 -52
- aiq/eval/swe_bench_evaluator/__init__.py +0 -0
- aiq/eval/swe_bench_evaluator/evaluate.py +0 -215
- aiq/eval/swe_bench_evaluator/register.py +0 -36
- aiq/eval/trajectory_evaluator/__init__.py +0 -0
- aiq/eval/trajectory_evaluator/evaluate.py +0 -118
- aiq/eval/trajectory_evaluator/register.py +0 -40
- aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
- aiq/eval/tunable_rag_evaluator/evaluate.py +0 -263
- aiq/eval/tunable_rag_evaluator/register.py +0 -50
- aiq/eval/utils/__init__.py +0 -0
- aiq/eval/utils/output_uploader.py +0 -131
- aiq/eval/utils/tqdm_position_registry.py +0 -40
- aiq/front_ends/__init__.py +0 -14
- aiq/front_ends/console/__init__.py +0 -14
- aiq/front_ends/console/console_front_end_config.py +0 -32
- aiq/front_ends/console/console_front_end_plugin.py +0 -107
- aiq/front_ends/console/register.py +0 -25
- aiq/front_ends/cron/__init__.py +0 -14
- aiq/front_ends/fastapi/__init__.py +0 -14
- aiq/front_ends/fastapi/fastapi_front_end_config.py +0 -150
- aiq/front_ends/fastapi/fastapi_front_end_plugin.py +0 -103
- aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +0 -607
- aiq/front_ends/fastapi/intermediate_steps_subscriber.py +0 -80
- aiq/front_ends/fastapi/job_store.py +0 -161
- aiq/front_ends/fastapi/main.py +0 -70
- aiq/front_ends/fastapi/message_handler.py +0 -279
- aiq/front_ends/fastapi/message_validator.py +0 -345
- aiq/front_ends/fastapi/register.py +0 -25
- aiq/front_ends/fastapi/response_helpers.py +0 -195
- aiq/front_ends/fastapi/step_adaptor.py +0 -320
- aiq/front_ends/fastapi/websocket.py +0 -148
- aiq/front_ends/mcp/__init__.py +0 -14
- aiq/front_ends/mcp/mcp_front_end_config.py +0 -32
- aiq/front_ends/mcp/mcp_front_end_plugin.py +0 -93
- aiq/front_ends/mcp/register.py +0 -27
- aiq/front_ends/mcp/tool_converter.py +0 -242
- aiq/front_ends/register.py +0 -22
- aiq/front_ends/simple_base/__init__.py +0 -14
- aiq/front_ends/simple_base/simple_front_end_plugin_base.py +0 -52
- aiq/llm/__init__.py +0 -0
- aiq/llm/nim_llm.py +0 -45
- aiq/llm/openai_llm.py +0 -45
- aiq/llm/register.py +0 -22
- aiq/llm/utils/__init__.py +0 -14
- aiq/llm/utils/env_config_value.py +0 -94
- aiq/llm/utils/error.py +0 -17
- aiq/memory/__init__.py +0 -20
- aiq/memory/interfaces.py +0 -183
- aiq/memory/models.py +0 -112
- aiq/meta/module_to_distro.json +0 -3
- aiq/meta/pypi.md +0 -58
- aiq/observability/__init__.py +0 -0
- aiq/observability/async_otel_listener.py +0 -429
- aiq/observability/register.py +0 -99
- aiq/plugins/.namespace +0 -1
- aiq/profiler/__init__.py +0 -0
- aiq/profiler/callbacks/__init__.py +0 -0
- aiq/profiler/callbacks/agno_callback_handler.py +0 -295
- aiq/profiler/callbacks/base_callback_class.py +0 -20
- aiq/profiler/callbacks/langchain_callback_handler.py +0 -278
- aiq/profiler/callbacks/llama_index_callback_handler.py +0 -205
- aiq/profiler/callbacks/semantic_kernel_callback_handler.py +0 -238
- aiq/profiler/callbacks/token_usage_base_model.py +0 -27
- aiq/profiler/data_frame_row.py +0 -51
- aiq/profiler/decorators/__init__.py +0 -0
- aiq/profiler/decorators/framework_wrapper.py +0 -131
- aiq/profiler/decorators/function_tracking.py +0 -254
- aiq/profiler/forecasting/__init__.py +0 -0
- aiq/profiler/forecasting/config.py +0 -18
- aiq/profiler/forecasting/model_trainer.py +0 -75
- aiq/profiler/forecasting/models/__init__.py +0 -22
- aiq/profiler/forecasting/models/forecasting_base_model.py +0 -40
- aiq/profiler/forecasting/models/linear_model.py +0 -196
- aiq/profiler/forecasting/models/random_forest_regressor.py +0 -268
- aiq/profiler/inference_metrics_model.py +0 -25
- aiq/profiler/inference_optimization/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +0 -452
- aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +0 -258
- aiq/profiler/inference_optimization/data_models.py +0 -386
- aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
- aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +0 -468
- aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +0 -405
- aiq/profiler/inference_optimization/llm_metrics.py +0 -212
- aiq/profiler/inference_optimization/prompt_caching.py +0 -163
- aiq/profiler/inference_optimization/token_uniqueness.py +0 -107
- aiq/profiler/inference_optimization/workflow_runtimes.py +0 -72
- aiq/profiler/intermediate_property_adapter.py +0 -102
- aiq/profiler/profile_runner.py +0 -433
- aiq/profiler/utils.py +0 -184
- aiq/registry_handlers/__init__.py +0 -0
- aiq/registry_handlers/local/__init__.py +0 -0
- aiq/registry_handlers/local/local_handler.py +0 -176
- aiq/registry_handlers/local/register_local.py +0 -37
- aiq/registry_handlers/metadata_factory.py +0 -60
- aiq/registry_handlers/package_utils.py +0 -198
- aiq/registry_handlers/pypi/__init__.py +0 -0
- aiq/registry_handlers/pypi/pypi_handler.py +0 -251
- aiq/registry_handlers/pypi/register_pypi.py +0 -40
- aiq/registry_handlers/register.py +0 -21
- aiq/registry_handlers/registry_handler_base.py +0 -157
- aiq/registry_handlers/rest/__init__.py +0 -0
- aiq/registry_handlers/rest/register_rest.py +0 -56
- aiq/registry_handlers/rest/rest_handler.py +0 -237
- aiq/registry_handlers/schemas/__init__.py +0 -0
- aiq/registry_handlers/schemas/headers.py +0 -42
- aiq/registry_handlers/schemas/package.py +0 -68
- aiq/registry_handlers/schemas/publish.py +0 -63
- aiq/registry_handlers/schemas/pull.py +0 -82
- aiq/registry_handlers/schemas/remove.py +0 -36
- aiq/registry_handlers/schemas/search.py +0 -91
- aiq/registry_handlers/schemas/status.py +0 -47
- aiq/retriever/__init__.py +0 -0
- aiq/retriever/interface.py +0 -37
- aiq/retriever/milvus/__init__.py +0 -14
- aiq/retriever/milvus/register.py +0 -81
- aiq/retriever/milvus/retriever.py +0 -228
- aiq/retriever/models.py +0 -74
- aiq/retriever/nemo_retriever/__init__.py +0 -14
- aiq/retriever/nemo_retriever/register.py +0 -60
- aiq/retriever/nemo_retriever/retriever.py +0 -190
- aiq/retriever/register.py +0 -22
- aiq/runtime/__init__.py +0 -14
- aiq/runtime/loader.py +0 -188
- aiq/runtime/runner.py +0 -176
- aiq/runtime/session.py +0 -140
- aiq/runtime/user_metadata.py +0 -131
- aiq/settings/__init__.py +0 -0
- aiq/settings/global_settings.py +0 -318
- aiq/test/.namespace +0 -1
- aiq/tool/__init__.py +0 -0
- aiq/tool/code_execution/__init__.py +0 -0
- aiq/tool/code_execution/code_sandbox.py +0 -188
- aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +0 -60
- aiq/tool/code_execution/local_sandbox/__init__.py +0 -13
- aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +0 -83
- aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +0 -4
- aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +0 -25
- aiq/tool/code_execution/register.py +0 -70
- aiq/tool/code_execution/utils.py +0 -100
- aiq/tool/datetime_tools.py +0 -42
- aiq/tool/document_search.py +0 -141
- aiq/tool/github_tools/__init__.py +0 -0
- aiq/tool/github_tools/create_github_commit.py +0 -133
- aiq/tool/github_tools/create_github_issue.py +0 -87
- aiq/tool/github_tools/create_github_pr.py +0 -106
- aiq/tool/github_tools/get_github_file.py +0 -106
- aiq/tool/github_tools/get_github_issue.py +0 -166
- aiq/tool/github_tools/get_github_pr.py +0 -256
- aiq/tool/github_tools/update_github_issue.py +0 -100
- aiq/tool/mcp/__init__.py +0 -14
- aiq/tool/mcp/mcp_client.py +0 -220
- aiq/tool/mcp/mcp_tool.py +0 -95
- aiq/tool/memory_tools/__init__.py +0 -0
- aiq/tool/memory_tools/add_memory_tool.py +0 -79
- aiq/tool/memory_tools/delete_memory_tool.py +0 -67
- aiq/tool/memory_tools/get_memory_tool.py +0 -72
- aiq/tool/nvidia_rag.py +0 -95
- aiq/tool/register.py +0 -37
- aiq/tool/retriever.py +0 -89
- aiq/tool/server_tools.py +0 -63
- aiq/utils/__init__.py +0 -0
- aiq/utils/data_models/__init__.py +0 -0
- aiq/utils/data_models/schema_validator.py +0 -58
- aiq/utils/debugging_utils.py +0 -43
- aiq/utils/exception_handlers/__init__.py +0 -0
- aiq/utils/exception_handlers/schemas.py +0 -114
- aiq/utils/io/__init__.py +0 -0
- aiq/utils/io/yaml_tools.py +0 -119
- aiq/utils/metadata_utils.py +0 -74
- aiq/utils/optional_imports.py +0 -142
- aiq/utils/producer_consumer_queue.py +0 -178
- aiq/utils/reactive/__init__.py +0 -0
- aiq/utils/reactive/base/__init__.py +0 -0
- aiq/utils/reactive/base/observable_base.py +0 -65
- aiq/utils/reactive/base/observer_base.py +0 -55
- aiq/utils/reactive/base/subject_base.py +0 -79
- aiq/utils/reactive/observable.py +0 -59
- aiq/utils/reactive/observer.py +0 -76
- aiq/utils/reactive/subject.py +0 -131
- aiq/utils/reactive/subscription.py +0 -49
- aiq/utils/settings/__init__.py +0 -0
- aiq/utils/settings/global_settings.py +0 -197
- aiq/utils/type_converter.py +0 -232
- aiq/utils/type_utils.py +0 -397
- aiq/utils/url_utils.py +0 -27
- aiqtoolkit-1.1.0a20250515.dist-info/METADATA +0 -331
- aiqtoolkit-1.1.0a20250515.dist-info/RECORD +0 -316
- aiqtoolkit-1.1.0a20250515.dist-info/entry_points.txt +0 -17
- aiqtoolkit-1.1.0a20250515.dist-info/licenses/LICENSE-3rd-party.txt +0 -3686
- aiqtoolkit-1.1.0a20250515.dist-info/licenses/LICENSE.md +0 -201
- aiqtoolkit-1.1.0a20250515.dist-info/top_level.txt +0 -1
|
@@ -1,26 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
import typing
|
|
17
|
-
|
|
18
|
-
from .common import BaseModelRegistryTag
|
|
19
|
-
from .common import TypedBaseModel
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
class RegistryHandlerBaseConfig(TypedBaseModel, BaseModelRegistryTag):
|
|
23
|
-
pass
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
RegistryHandlerBaseConfigT = typing.TypeVar("RegistryHandlerBaseConfigT", bound=RegistryHandlerBaseConfig)
|
aiq/data_models/retriever.py
DELETED
|
@@ -1,30 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
import typing
|
|
17
|
-
|
|
18
|
-
from aiq.data_models.common import BaseModelRegistryTag
|
|
19
|
-
from aiq.data_models.common import TypedBaseModel
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
class RetrieverBaseConfig(TypedBaseModel, BaseModelRegistryTag):
|
|
23
|
-
"""
|
|
24
|
-
The base level config object for a retriever object. Retrievers use different provider clients (e.g., Milvus) to
|
|
25
|
-
provide an interface for searching for and retrieving documents from the configured data store.
|
|
26
|
-
"""
|
|
27
|
-
pass
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
RetrieverBaseConfigT = typing.TypeVar("RetrieverBaseConfigT", bound=RetrieverBaseConfig)
|
aiq/data_models/step_adaptor.py
DELETED
|
@@ -1,64 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
import logging
|
|
17
|
-
from enum import Enum
|
|
18
|
-
|
|
19
|
-
from pydantic import BaseModel
|
|
20
|
-
from pydantic import Field
|
|
21
|
-
from pydantic import model_validator
|
|
22
|
-
|
|
23
|
-
from aiq.data_models.intermediate_step import IntermediateStepType
|
|
24
|
-
|
|
25
|
-
logger = logging.getLogger(__name__)
|
|
26
|
-
|
|
27
|
-
|
|
28
|
-
class StepAdaptorMode(str, Enum):
|
|
29
|
-
DEFAULT = "default"
|
|
30
|
-
CUSTOM = "custom"
|
|
31
|
-
OFF = "off"
|
|
32
|
-
|
|
33
|
-
|
|
34
|
-
class StepAdaptorConfig(BaseModel):
|
|
35
|
-
"""
|
|
36
|
-
Configures how intermediate steps are filtered and normalized by the StepAdaptor.
|
|
37
|
-
|
|
38
|
-
Args:
|
|
39
|
-
mode (StepAdaptorMode): One of:
|
|
40
|
-
- 'current' => pass only LLM (all LLM_* events) + TOOL_END
|
|
41
|
-
- 'end_events_only' => pass only LLM_END and TOOL_END
|
|
42
|
-
- 'custom' => pass only the events in custom_event_types
|
|
43
|
-
custom_event_types (list[IntermediateStepType]):
|
|
44
|
-
If mode == 'custom', we only pass events whose event_type is in this list.
|
|
45
|
-
Otherwise, this field is ignored.
|
|
46
|
-
"""
|
|
47
|
-
mode: StepAdaptorMode = StepAdaptorMode.DEFAULT
|
|
48
|
-
custom_event_types: list[IntermediateStepType] = Field(default_factory=list)
|
|
49
|
-
|
|
50
|
-
@model_validator(mode="after")
|
|
51
|
-
def check_custom_event_types(self) -> "StepAdaptorConfig":
|
|
52
|
-
"""
|
|
53
|
-
Validates custom configurations
|
|
54
|
-
"""
|
|
55
|
-
if self.mode != StepAdaptorMode.CUSTOM and self.custom_event_types:
|
|
56
|
-
logger.warning("Ignoring custom_event_types because mode is not 'custom'")
|
|
57
|
-
self.custom_event_types = []
|
|
58
|
-
elif self.mode == StepAdaptorMode.CUSTOM and not self.custom_event_types:
|
|
59
|
-
logger.warning("No custom_event_types provided for custom mode. Defaulting to CUSTOM_START and CUSTOM_END")
|
|
60
|
-
self.custom_event_types = [IntermediateStepType.CUSTOM_START, IntermediateStepType.CUSTOM_END]
|
|
61
|
-
elif self.mode == StepAdaptorMode.OFF:
|
|
62
|
-
logger.warning("StepAdaptor is disabled. Ignoring all intermediate event types")
|
|
63
|
-
self.custom_event_types = []
|
|
64
|
-
return self
|
aiq/data_models/streaming.py
DELETED
|
@@ -1,33 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
import inspect
|
|
17
|
-
import typing
|
|
18
|
-
from collections.abc import Callable
|
|
19
|
-
|
|
20
|
-
_T = typing.TypeVar("_T")
|
|
21
|
-
|
|
22
|
-
|
|
23
|
-
class Streaming(typing.Generic[_T]):
|
|
24
|
-
|
|
25
|
-
def __init__(self, *, convert: Callable[[typing.Any], _T] = None):
|
|
26
|
-
self.convert = convert
|
|
27
|
-
|
|
28
|
-
sig = inspect.signature(self.convert)
|
|
29
|
-
|
|
30
|
-
if (sig.return_annotation == inspect.Parameter.empty):
|
|
31
|
-
raise ValueError("convert must have a return annotation")
|
|
32
|
-
|
|
33
|
-
self.single_output_type = sig.return_annotation
|
|
@@ -1,54 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
import json
|
|
17
|
-
|
|
18
|
-
from pydantic import BaseModel
|
|
19
|
-
from pydantic import ConfigDict
|
|
20
|
-
from pydantic import field_validator
|
|
21
|
-
|
|
22
|
-
|
|
23
|
-
class SWEBenchInput(BaseModel):
|
|
24
|
-
# Allow extra fields in the model_config to support derived models
|
|
25
|
-
model_config = ConfigDict(extra="allow")
|
|
26
|
-
|
|
27
|
-
repo: str
|
|
28
|
-
instance_id: str
|
|
29
|
-
base_commit: str
|
|
30
|
-
patch: str
|
|
31
|
-
test_patch: str
|
|
32
|
-
problem_statement: str
|
|
33
|
-
hints_text: str
|
|
34
|
-
created_at: str | int
|
|
35
|
-
version: float
|
|
36
|
-
FAIL_TO_PASS: list[str]
|
|
37
|
-
PASS_TO_PASS: list[str]
|
|
38
|
-
environment_setup_commit: str
|
|
39
|
-
|
|
40
|
-
# Handle improperly formatted JSON strings for list fields
|
|
41
|
-
@field_validator("FAIL_TO_PASS", "PASS_TO_PASS", mode="before")
|
|
42
|
-
def parse_list_fields(cls, value): # pylint: disable=no-self-argument
|
|
43
|
-
if isinstance(value, str):
|
|
44
|
-
# Attempt to parse the string as a list
|
|
45
|
-
return json.loads(value)
|
|
46
|
-
return value
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
class SWEBenchOutput(BaseModel):
|
|
50
|
-
model_config = ConfigDict(protected_namespaces=(), populate_by_name=True)
|
|
51
|
-
|
|
52
|
-
instance_id: str
|
|
53
|
-
model_name_or_path: str
|
|
54
|
-
model_patch: str
|
|
@@ -1,26 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
import typing
|
|
17
|
-
|
|
18
|
-
from .common import BaseModelRegistryTag
|
|
19
|
-
from .common import TypedBaseModel
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
class TelemetryExporterBaseConfig(TypedBaseModel, BaseModelRegistryTag):
|
|
23
|
-
pass
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
TelemetryExporterConfigT = typing.TypeVar("TelemetryExporterConfigT", bound=TelemetryExporterBaseConfig)
|
aiq/embedder/__init__.py
DELETED
|
File without changes
|
aiq/embedder/langchain_client.py
DELETED
|
@@ -1,41 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
from aiq.builder.builder import Builder
|
|
17
|
-
from aiq.builder.framework_enum import LLMFrameworkEnum
|
|
18
|
-
from aiq.cli.register_workflow import register_embedder_client
|
|
19
|
-
from aiq.embedder.nim_embedder import NIMEmbedderModelConfig
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
@register_embedder_client(config_type=NIMEmbedderModelConfig, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
|
|
23
|
-
async def nim_langchain(embedder_config: NIMEmbedderModelConfig, builder: Builder):
|
|
24
|
-
|
|
25
|
-
from langchain_nvidia_ai_endpoints import NVIDIAEmbeddings
|
|
26
|
-
|
|
27
|
-
yield NVIDIAEmbeddings(**embedder_config.model_dump(exclude={"type"}, by_alias=True))
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
@register_embedder_client(config_type=NIMEmbedderModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
|
|
31
|
-
async def nim_llamaindex(embedder_config: NIMEmbedderModelConfig, builder: Builder):
|
|
32
|
-
|
|
33
|
-
from llama_index.embeddings.nvidia import NVIDIAEmbedding # pylint: disable=no-name-in-module
|
|
34
|
-
|
|
35
|
-
config_obj = {
|
|
36
|
-
**embedder_config.model_dump(exclude={"type", "model_name"}, by_alias=True),
|
|
37
|
-
"model":
|
|
38
|
-
embedder_config.model_name,
|
|
39
|
-
}
|
|
40
|
-
|
|
41
|
-
yield NVIDIAEmbedding(**config_obj)
|
aiq/embedder/nim_embedder.py
DELETED
|
@@ -1,58 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
import typing
|
|
17
|
-
|
|
18
|
-
from pydantic import AfterValidator
|
|
19
|
-
from pydantic import AliasChoices
|
|
20
|
-
from pydantic import ConfigDict
|
|
21
|
-
from pydantic import Field
|
|
22
|
-
|
|
23
|
-
from aiq.builder.builder import Builder
|
|
24
|
-
from aiq.builder.embedder import EmbedderProviderInfo
|
|
25
|
-
from aiq.cli.register_workflow import register_embedder_provider
|
|
26
|
-
from aiq.data_models.embedder import EmbedderBaseConfig
|
|
27
|
-
|
|
28
|
-
allowed_truncate_values = ["NONE", "START", "END"]
|
|
29
|
-
|
|
30
|
-
|
|
31
|
-
def option_in_allowed_values(v):
|
|
32
|
-
"""Ensures option is allowed"""
|
|
33
|
-
assert v in allowed_truncate_values
|
|
34
|
-
return v
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
TruncationOption = typing.Annotated[str, AfterValidator(option_in_allowed_values)]
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
class NIMEmbedderModelConfig(EmbedderBaseConfig, name="nim"):
|
|
41
|
-
"""A NVIDIA Inference Microservice (NIM) embedder provider to be used with an embedder client."""
|
|
42
|
-
|
|
43
|
-
api_key: str | None = Field(default=None, description="NVIDIA API key to interact with hosted NIM.")
|
|
44
|
-
base_url: str | None = Field(default=None, description="Base url to the hosted NIM.")
|
|
45
|
-
model_name: str = Field(validation_alias=AliasChoices("model_name", "model"),
|
|
46
|
-
serialization_alias="model",
|
|
47
|
-
description="The model name for the hosted NIM.")
|
|
48
|
-
truncate: TruncationOption = Field(default="NONE",
|
|
49
|
-
description=("The truncation strategy if the input on the "
|
|
50
|
-
"server side if it's too large."))
|
|
51
|
-
|
|
52
|
-
model_config = ConfigDict(protected_namespaces=())
|
|
53
|
-
|
|
54
|
-
|
|
55
|
-
@register_embedder_provider(config_type=NIMEmbedderModelConfig)
|
|
56
|
-
async def nim_embedder_model(embedder_config: NIMEmbedderModelConfig, builder: Builder):
|
|
57
|
-
|
|
58
|
-
yield EmbedderProviderInfo(config=embedder_config, description="A NIM model for use with an Embedder client.")
|
aiq/embedder/openai_embedder.py
DELETED
|
@@ -1,42 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
from pydantic import AliasChoices
|
|
17
|
-
from pydantic import ConfigDict
|
|
18
|
-
from pydantic import Field
|
|
19
|
-
|
|
20
|
-
from aiq.builder.builder import Builder
|
|
21
|
-
from aiq.builder.embedder import EmbedderProviderInfo
|
|
22
|
-
from aiq.cli.register_workflow import register_embedder_provider
|
|
23
|
-
from aiq.data_models.embedder import EmbedderBaseConfig
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
class OpenAIEmbedderModelConfig(EmbedderBaseConfig, name="openai"):
    """An OpenAI embedder provider to be used with an embedder client."""

    # An empty protected-namespace tuple lets the ``model_name`` field below
    # coexist with pydantic's reserved ``model_`` prefix.
    model_config = ConfigDict(protected_namespaces=())

    api_key: str | None = Field(default=None, description="OpenAI API key to interact with hosted model.")
    base_url: str | None = Field(default=None, description="Base url to the hosted model.")
    # Accepted on input as either ``model_name`` or ``model``; serialized as ``model``.
    model_name: str = Field(validation_alias=AliasChoices("model_name", "model"),
                            serialization_alias="model",
                            description="The OpenAI hosted model name.")
    max_retries: int = Field(default=2, description="The max number of retries for the request.")
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
@register_embedder_provider(config_type=OpenAIEmbedderModelConfig)
async def openai_llm(config: OpenAIEmbedderModelConfig, builder: Builder):
    """Yield the provider info describing an OpenAI embedder configuration.

    Despite the ``llm`` in its name, this function is registered as an embedder
    provider for ``OpenAIEmbedderModelConfig``. ``builder`` is accepted but not
    used in this body.
    """
    provider_info = EmbedderProviderInfo(config=config,
                                         description="An OpenAI model for use with an Embedder client.")
    yield provider_info
|
aiq/embedder/register.py
DELETED
|
@@ -1,24 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
# pylint: disable=unused-import
|
|
17
|
-
# flake8: noqa
|
|
18
|
-
# isort:skip_file
|
|
19
|
-
|
|
20
|
-
# Import any providers which need to be automatically registered here
|
|
21
|
-
from . import nim_embedder
|
|
22
|
-
from . import openai_embedder
|
|
23
|
-
# Import any clients which need to be automatically registered here
|
|
24
|
-
from . import langchain_client
|
aiq/eval/__init__.py
DELETED
|
@@ -1,14 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
aiq/eval/config.py
DELETED
|
@@ -1,42 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
from pathlib import Path
|
|
17
|
-
|
|
18
|
-
from pydantic import BaseModel
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
class EvaluationRunConfig(BaseModel):
    """
    Parameters used for a single evaluation run.
    """
    config_file: Path
    # Dataset file path; it can be specified in the config file instead.
    dataset: str | None
    result_json_path: str = "$"
    skip_workflow: bool = False
    skip_completed_entries: bool = False
    # Only used when running the workflow remotely.
    endpoint: str | None = None
    endpoint_timeout: int = 300
    reps: int = 1
    # Pairs of strings; presumably (config key, value) overrides -- confirm against the caller.
    override: tuple[tuple[str, str], ...] = ()
|
|
34
|
-
|
|
35
|
-
|
|
36
|
-
class EvaluationRunOutput(BaseModel):
    """
    Output of a single evaluation run.
    """
    # May be None; all three fields are required (no defaults are declared).
    workflow_output_file: Path | None
    evaluator_output_files: list[Path]
    workflow_interrupted: bool
|
|
File without changes
|
|
@@ -1,106 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
import logging
|
|
16
|
-
from pathlib import Path
|
|
17
|
-
|
|
18
|
-
import boto3
|
|
19
|
-
import requests
|
|
20
|
-
from botocore.exceptions import NoCredentialsError
|
|
21
|
-
|
|
22
|
-
from aiq.data_models.dataset_handler import EvalDatasetConfig
|
|
23
|
-
|
|
24
|
-
logger = logging.getLogger(__name__)
|
|
25
|
-
|
|
26
|
-
|
|
27
|
-
class DatasetDownloader:
    """
    Download remote datasets using signed URLs or S3 credentials.

    One DatasetDownloader object is needed for each dataset to be downloaded.
    """

    def __init__(self, dataset_config: EvalDatasetConfig):
        self.dataset_config = dataset_config
        # Created on first access of the ``s3_client`` property.
        self._s3_client = None

    @property
    def s3_config(self):
        """Return the ``s3`` section of the dataset configuration."""
        return self.dataset_config.s3

    @property
    def s3_client(self):
        """Lazy init the S3 client.

        Errors raised while creating the client are logged and re-raised.
        """
        if self._s3_client is None:
            try:
                self._s3_client = boto3.client("s3",
                                               endpoint_url=self.s3_config.endpoint_url,
                                               aws_access_key_id=self.s3_config.access_key,
                                               aws_secret_access_key=self.s3_config.secret_key)
            except NoCredentialsError as e:
                logger.error("AWS credentials not available: %s", e)
                raise
            except Exception as e:
                logger.error("Failed to initialize S3 client: %s", e)
                raise
        return self._s3_client

    @staticmethod
    def ensure_directory_exists(file_path: str):
        """Ensure the directory for the file exists."""
        Path(file_path).parent.mkdir(parents=True, exist_ok=True)

    def download_with_signed_url(self, remote_file_path: str, local_file_path: str, timeout: int = 300):
        """Download a file using a signed URL.

        The body is streamed to ``local_file_path`` in 8192-byte chunks.
        ``requests`` errors are logged and re-raised.
        """
        try:
            response = requests.get(remote_file_path, stream=True, timeout=timeout)
            try:
                response.raise_for_status()
                with open(local_file_path, "wb") as file:
                    for chunk in response.iter_content(chunk_size=8192):
                        file.write(chunk)
            finally:
                # A streamed response holds its connection until closed.
                response.close()
            logger.info("File downloaded successfully to %s using signed URL.", local_file_path)
        except requests.exceptions.RequestException as e:
            logger.error("Error downloading file using signed URL: %s", e)
            raise

    def download_with_boto3(self, remote_file_path: str, local_file_path: str):
        """Download a file using boto3 and credentials.

        ``remote_file_path`` is passed as the object key within the configured bucket.
        Any error is logged and re-raised.
        """
        try:
            self.s3_client.download_file(self.s3_config.bucket, remote_file_path, local_file_path)
            logger.info("File downloaded successfully to %s using S3 client.", local_file_path)
        except Exception as e:
            logger.error("Error downloading file from S3: %s", e)
            raise

    @staticmethod
    def is_file_path_url(file_path: str) -> bool:
        """Check if the file path is an ``http://`` or ``https://`` URL."""
        # Match the full scheme so keys such as "http_exports/x.json" are not mistaken for URLs.
        return file_path.startswith(("http://", "https://"))

    def download_file(self, remote_file_path: str, local_file_path: str):
        """Download a file using the appropriate method.

        URLs are fetched as signed URLs (120 second timeout); anything else is
        fetched through the S3 client. The local parent directory is created first.
        """
        self.ensure_directory_exists(local_file_path)
        if self.is_file_path_url(remote_file_path):
            logger.info("Using signed URL to download the file %s...", remote_file_path)
            self.download_with_signed_url(remote_file_path, local_file_path, timeout=120)
        else:
            logger.info("Using S3 credentials to download the file %s...", remote_file_path)
            self.download_with_boto3(remote_file_path, local_file_path)

    def download_dataset(self):
        """Download the dataset when the configuration sets ``remote_file_path``; otherwise do nothing."""
        remote_file_path = self.dataset_config.remote_file_path
        if remote_file_path:
            # The placeholder previously had no argument, so "%s" was logged literally.
            logger.info("Downloading remote dataset %s", remote_file_path)
            self.download_file(remote_file_path=remote_file_path,
                               local_file_path=self.dataset_config.file_path)
|
|
@@ -1,52 +0,0 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
-
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
-
#
|
|
4
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
-
# you may not use this file except in compliance with the License.
|
|
6
|
-
# You may obtain a copy of the License at
|
|
7
|
-
#
|
|
8
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
-
#
|
|
10
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
-
# See the License for the specific language governing permissions and
|
|
14
|
-
# limitations under the License.
|
|
15
|
-
|
|
16
|
-
import pandas as pd
|
|
17
|
-
|
|
18
|
-
from aiq.data_models.dataset_handler import EvalFilterConfig
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
class DatasetFilter:
    """
    Filter a DataFrame by column values using an allowlist and a denylist.
    - Allowlist: for each listed column, keep only the rows whose value is among the given values.
    - Denylist: for each listed column, drop the rows whose value is among the given values.
    - A filter column that does not exist in the DataFrame is skipped.

    This utility is dataset agnostic and can be applied to any DataFrame with the provided
    filter configuration.
    """

    def __init__(self, filter_config: EvalFilterConfig):
        self.filter_config = filter_config

    def apply_filters(self, df) -> pd.DataFrame:
        """Return a filtered copy of ``df``; the allowlist is applied before the denylist."""
        result = df.copy()

        # Allowlist pass: retain only matching rows.
        allow = self.filter_config.allowlist
        if allow:
            for name, accepted in allow.field.items():
                if name not in result.columns:
                    continue
                keep_mask = result[name].isin(accepted)
                result = result[keep_mask]

        # Denylist pass: discard matching rows.
        deny = self.filter_config.denylist
        if deny:
            for name, rejected in deny.field.items():
                if name not in result.columns:
                    continue
                drop_mask = result[name].isin(rejected)
                result = result[~drop_mask]

        return result
|