nvidia-nat 1.2.0rc5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- aiq/agent/__init__.py +0 -0
- aiq/agent/base.py +239 -0
- aiq/agent/dual_node.py +67 -0
- aiq/agent/react_agent/__init__.py +0 -0
- aiq/agent/react_agent/agent.py +355 -0
- aiq/agent/react_agent/output_parser.py +104 -0
- aiq/agent/react_agent/prompt.py +41 -0
- aiq/agent/react_agent/register.py +149 -0
- aiq/agent/reasoning_agent/__init__.py +0 -0
- aiq/agent/reasoning_agent/reasoning_agent.py +225 -0
- aiq/agent/register.py +23 -0
- aiq/agent/rewoo_agent/__init__.py +0 -0
- aiq/agent/rewoo_agent/agent.py +411 -0
- aiq/agent/rewoo_agent/prompt.py +108 -0
- aiq/agent/rewoo_agent/register.py +158 -0
- aiq/agent/tool_calling_agent/__init__.py +0 -0
- aiq/agent/tool_calling_agent/agent.py +119 -0
- aiq/agent/tool_calling_agent/register.py +106 -0
- aiq/authentication/__init__.py +14 -0
- aiq/authentication/api_key/__init__.py +14 -0
- aiq/authentication/api_key/api_key_auth_provider.py +96 -0
- aiq/authentication/api_key/api_key_auth_provider_config.py +124 -0
- aiq/authentication/api_key/register.py +26 -0
- aiq/authentication/exceptions/__init__.py +14 -0
- aiq/authentication/exceptions/api_key_exceptions.py +38 -0
- aiq/authentication/http_basic_auth/__init__.py +0 -0
- aiq/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
- aiq/authentication/http_basic_auth/register.py +30 -0
- aiq/authentication/interfaces.py +93 -0
- aiq/authentication/oauth2/__init__.py +14 -0
- aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +107 -0
- aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
- aiq/authentication/oauth2/register.py +25 -0
- aiq/authentication/register.py +21 -0
- aiq/builder/__init__.py +0 -0
- aiq/builder/builder.py +285 -0
- aiq/builder/component_utils.py +316 -0
- aiq/builder/context.py +264 -0
- aiq/builder/embedder.py +24 -0
- aiq/builder/eval_builder.py +161 -0
- aiq/builder/evaluator.py +29 -0
- aiq/builder/framework_enum.py +24 -0
- aiq/builder/front_end.py +73 -0
- aiq/builder/function.py +344 -0
- aiq/builder/function_base.py +380 -0
- aiq/builder/function_info.py +627 -0
- aiq/builder/intermediate_step_manager.py +174 -0
- aiq/builder/llm.py +25 -0
- aiq/builder/retriever.py +25 -0
- aiq/builder/user_interaction_manager.py +74 -0
- aiq/builder/workflow.py +148 -0
- aiq/builder/workflow_builder.py +1117 -0
- aiq/cli/__init__.py +14 -0
- aiq/cli/cli_utils/__init__.py +0 -0
- aiq/cli/cli_utils/config_override.py +231 -0
- aiq/cli/cli_utils/validation.py +37 -0
- aiq/cli/commands/__init__.py +0 -0
- aiq/cli/commands/configure/__init__.py +0 -0
- aiq/cli/commands/configure/channel/__init__.py +0 -0
- aiq/cli/commands/configure/channel/add.py +28 -0
- aiq/cli/commands/configure/channel/channel.py +36 -0
- aiq/cli/commands/configure/channel/remove.py +30 -0
- aiq/cli/commands/configure/channel/update.py +30 -0
- aiq/cli/commands/configure/configure.py +33 -0
- aiq/cli/commands/evaluate.py +139 -0
- aiq/cli/commands/info/__init__.py +14 -0
- aiq/cli/commands/info/info.py +39 -0
- aiq/cli/commands/info/list_channels.py +32 -0
- aiq/cli/commands/info/list_components.py +129 -0
- aiq/cli/commands/info/list_mcp.py +213 -0
- aiq/cli/commands/registry/__init__.py +14 -0
- aiq/cli/commands/registry/publish.py +88 -0
- aiq/cli/commands/registry/pull.py +118 -0
- aiq/cli/commands/registry/registry.py +38 -0
- aiq/cli/commands/registry/remove.py +108 -0
- aiq/cli/commands/registry/search.py +155 -0
- aiq/cli/commands/sizing/__init__.py +14 -0
- aiq/cli/commands/sizing/calc.py +297 -0
- aiq/cli/commands/sizing/sizing.py +27 -0
- aiq/cli/commands/start.py +246 -0
- aiq/cli/commands/uninstall.py +81 -0
- aiq/cli/commands/validate.py +47 -0
- aiq/cli/commands/workflow/__init__.py +14 -0
- aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
- aiq/cli/commands/workflow/templates/config.yml.j2 +16 -0
- aiq/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
- aiq/cli/commands/workflow/templates/register.py.j2 +5 -0
- aiq/cli/commands/workflow/templates/workflow.py.j2 +36 -0
- aiq/cli/commands/workflow/workflow.py +37 -0
- aiq/cli/commands/workflow/workflow_commands.py +313 -0
- aiq/cli/entrypoint.py +135 -0
- aiq/cli/main.py +44 -0
- aiq/cli/register_workflow.py +488 -0
- aiq/cli/type_registry.py +1000 -0
- aiq/data_models/__init__.py +14 -0
- aiq/data_models/api_server.py +694 -0
- aiq/data_models/authentication.py +231 -0
- aiq/data_models/common.py +171 -0
- aiq/data_models/component.py +54 -0
- aiq/data_models/component_ref.py +168 -0
- aiq/data_models/config.py +406 -0
- aiq/data_models/dataset_handler.py +123 -0
- aiq/data_models/discovery_metadata.py +335 -0
- aiq/data_models/embedder.py +27 -0
- aiq/data_models/evaluate.py +127 -0
- aiq/data_models/evaluator.py +26 -0
- aiq/data_models/front_end.py +26 -0
- aiq/data_models/function.py +30 -0
- aiq/data_models/function_dependencies.py +72 -0
- aiq/data_models/interactive.py +246 -0
- aiq/data_models/intermediate_step.py +302 -0
- aiq/data_models/invocation_node.py +38 -0
- aiq/data_models/llm.py +27 -0
- aiq/data_models/logging.py +26 -0
- aiq/data_models/memory.py +27 -0
- aiq/data_models/object_store.py +44 -0
- aiq/data_models/profiler.py +54 -0
- aiq/data_models/registry_handler.py +26 -0
- aiq/data_models/retriever.py +30 -0
- aiq/data_models/retry_mixin.py +35 -0
- aiq/data_models/span.py +187 -0
- aiq/data_models/step_adaptor.py +64 -0
- aiq/data_models/streaming.py +33 -0
- aiq/data_models/swe_bench_model.py +54 -0
- aiq/data_models/telemetry_exporter.py +26 -0
- aiq/data_models/ttc_strategy.py +30 -0
- aiq/embedder/__init__.py +0 -0
- aiq/embedder/langchain_client.py +41 -0
- aiq/embedder/nim_embedder.py +59 -0
- aiq/embedder/openai_embedder.py +43 -0
- aiq/embedder/register.py +24 -0
- aiq/eval/__init__.py +14 -0
- aiq/eval/config.py +60 -0
- aiq/eval/dataset_handler/__init__.py +0 -0
- aiq/eval/dataset_handler/dataset_downloader.py +106 -0
- aiq/eval/dataset_handler/dataset_filter.py +52 -0
- aiq/eval/dataset_handler/dataset_handler.py +254 -0
- aiq/eval/evaluate.py +506 -0
- aiq/eval/evaluator/__init__.py +14 -0
- aiq/eval/evaluator/base_evaluator.py +73 -0
- aiq/eval/evaluator/evaluator_model.py +45 -0
- aiq/eval/intermediate_step_adapter.py +99 -0
- aiq/eval/rag_evaluator/__init__.py +0 -0
- aiq/eval/rag_evaluator/evaluate.py +178 -0
- aiq/eval/rag_evaluator/register.py +143 -0
- aiq/eval/register.py +23 -0
- aiq/eval/remote_workflow.py +133 -0
- aiq/eval/runners/__init__.py +14 -0
- aiq/eval/runners/config.py +39 -0
- aiq/eval/runners/multi_eval_runner.py +54 -0
- aiq/eval/runtime_event_subscriber.py +52 -0
- aiq/eval/swe_bench_evaluator/__init__.py +0 -0
- aiq/eval/swe_bench_evaluator/evaluate.py +215 -0
- aiq/eval/swe_bench_evaluator/register.py +36 -0
- aiq/eval/trajectory_evaluator/__init__.py +0 -0
- aiq/eval/trajectory_evaluator/evaluate.py +75 -0
- aiq/eval/trajectory_evaluator/register.py +40 -0
- aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
- aiq/eval/tunable_rag_evaluator/evaluate.py +245 -0
- aiq/eval/tunable_rag_evaluator/register.py +52 -0
- aiq/eval/usage_stats.py +41 -0
- aiq/eval/utils/__init__.py +0 -0
- aiq/eval/utils/output_uploader.py +140 -0
- aiq/eval/utils/tqdm_position_registry.py +40 -0
- aiq/eval/utils/weave_eval.py +184 -0
- aiq/experimental/__init__.py +0 -0
- aiq/experimental/decorators/__init__.py +0 -0
- aiq/experimental/decorators/experimental_warning_decorator.py +130 -0
- aiq/experimental/test_time_compute/__init__.py +0 -0
- aiq/experimental/test_time_compute/editing/__init__.py +0 -0
- aiq/experimental/test_time_compute/editing/iterative_plan_refinement_editor.py +147 -0
- aiq/experimental/test_time_compute/editing/llm_as_a_judge_editor.py +204 -0
- aiq/experimental/test_time_compute/editing/motivation_aware_summarization.py +107 -0
- aiq/experimental/test_time_compute/functions/__init__.py +0 -0
- aiq/experimental/test_time_compute/functions/execute_score_select_function.py +105 -0
- aiq/experimental/test_time_compute/functions/its_tool_orchestration_function.py +205 -0
- aiq/experimental/test_time_compute/functions/its_tool_wrapper_function.py +146 -0
- aiq/experimental/test_time_compute/functions/plan_select_execute_function.py +224 -0
- aiq/experimental/test_time_compute/models/__init__.py +0 -0
- aiq/experimental/test_time_compute/models/editor_config.py +132 -0
- aiq/experimental/test_time_compute/models/scoring_config.py +112 -0
- aiq/experimental/test_time_compute/models/search_config.py +120 -0
- aiq/experimental/test_time_compute/models/selection_config.py +154 -0
- aiq/experimental/test_time_compute/models/stage_enums.py +43 -0
- aiq/experimental/test_time_compute/models/strategy_base.py +66 -0
- aiq/experimental/test_time_compute/models/tool_use_config.py +41 -0
- aiq/experimental/test_time_compute/models/ttc_item.py +48 -0
- aiq/experimental/test_time_compute/register.py +36 -0
- aiq/experimental/test_time_compute/scoring/__init__.py +0 -0
- aiq/experimental/test_time_compute/scoring/llm_based_agent_scorer.py +168 -0
- aiq/experimental/test_time_compute/scoring/llm_based_plan_scorer.py +168 -0
- aiq/experimental/test_time_compute/scoring/motivation_aware_scorer.py +111 -0
- aiq/experimental/test_time_compute/search/__init__.py +0 -0
- aiq/experimental/test_time_compute/search/multi_llm_planner.py +128 -0
- aiq/experimental/test_time_compute/search/multi_query_retrieval_search.py +122 -0
- aiq/experimental/test_time_compute/search/single_shot_multi_plan_planner.py +128 -0
- aiq/experimental/test_time_compute/selection/__init__.py +0 -0
- aiq/experimental/test_time_compute/selection/best_of_n_selector.py +63 -0
- aiq/experimental/test_time_compute/selection/llm_based_agent_output_selector.py +131 -0
- aiq/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +159 -0
- aiq/experimental/test_time_compute/selection/llm_based_plan_selector.py +128 -0
- aiq/experimental/test_time_compute/selection/threshold_selector.py +58 -0
- aiq/front_ends/__init__.py +14 -0
- aiq/front_ends/console/__init__.py +14 -0
- aiq/front_ends/console/authentication_flow_handler.py +233 -0
- aiq/front_ends/console/console_front_end_config.py +32 -0
- aiq/front_ends/console/console_front_end_plugin.py +96 -0
- aiq/front_ends/console/register.py +25 -0
- aiq/front_ends/cron/__init__.py +14 -0
- aiq/front_ends/fastapi/__init__.py +14 -0
- aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
- aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
- aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +107 -0
- aiq/front_ends/fastapi/fastapi_front_end_config.py +234 -0
- aiq/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
- aiq/front_ends/fastapi/fastapi_front_end_plugin.py +116 -0
- aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +1092 -0
- aiq/front_ends/fastapi/html_snippets/__init__.py +14 -0
- aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
- aiq/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
- aiq/front_ends/fastapi/job_store.py +183 -0
- aiq/front_ends/fastapi/main.py +72 -0
- aiq/front_ends/fastapi/message_handler.py +298 -0
- aiq/front_ends/fastapi/message_validator.py +345 -0
- aiq/front_ends/fastapi/register.py +25 -0
- aiq/front_ends/fastapi/response_helpers.py +195 -0
- aiq/front_ends/fastapi/step_adaptor.py +321 -0
- aiq/front_ends/mcp/__init__.py +14 -0
- aiq/front_ends/mcp/mcp_front_end_config.py +32 -0
- aiq/front_ends/mcp/mcp_front_end_plugin.py +93 -0
- aiq/front_ends/mcp/register.py +27 -0
- aiq/front_ends/mcp/tool_converter.py +242 -0
- aiq/front_ends/register.py +22 -0
- aiq/front_ends/simple_base/__init__.py +14 -0
- aiq/front_ends/simple_base/simple_front_end_plugin_base.py +54 -0
- aiq/llm/__init__.py +0 -0
- aiq/llm/aws_bedrock_llm.py +57 -0
- aiq/llm/nim_llm.py +46 -0
- aiq/llm/openai_llm.py +46 -0
- aiq/llm/register.py +23 -0
- aiq/llm/utils/__init__.py +14 -0
- aiq/llm/utils/env_config_value.py +94 -0
- aiq/llm/utils/error.py +17 -0
- aiq/memory/__init__.py +20 -0
- aiq/memory/interfaces.py +183 -0
- aiq/memory/models.py +112 -0
- aiq/meta/module_to_distro.json +3 -0
- aiq/meta/pypi.md +58 -0
- aiq/object_store/__init__.py +20 -0
- aiq/object_store/in_memory_object_store.py +76 -0
- aiq/object_store/interfaces.py +84 -0
- aiq/object_store/models.py +36 -0
- aiq/object_store/register.py +20 -0
- aiq/observability/__init__.py +14 -0
- aiq/observability/exporter/__init__.py +14 -0
- aiq/observability/exporter/base_exporter.py +449 -0
- aiq/observability/exporter/exporter.py +78 -0
- aiq/observability/exporter/file_exporter.py +33 -0
- aiq/observability/exporter/processing_exporter.py +322 -0
- aiq/observability/exporter/raw_exporter.py +52 -0
- aiq/observability/exporter/span_exporter.py +265 -0
- aiq/observability/exporter_manager.py +335 -0
- aiq/observability/mixin/__init__.py +14 -0
- aiq/observability/mixin/batch_config_mixin.py +26 -0
- aiq/observability/mixin/collector_config_mixin.py +23 -0
- aiq/observability/mixin/file_mixin.py +288 -0
- aiq/observability/mixin/file_mode.py +23 -0
- aiq/observability/mixin/resource_conflict_mixin.py +134 -0
- aiq/observability/mixin/serialize_mixin.py +61 -0
- aiq/observability/mixin/type_introspection_mixin.py +183 -0
- aiq/observability/processor/__init__.py +14 -0
- aiq/observability/processor/batching_processor.py +310 -0
- aiq/observability/processor/callback_processor.py +42 -0
- aiq/observability/processor/intermediate_step_serializer.py +28 -0
- aiq/observability/processor/processor.py +71 -0
- aiq/observability/register.py +96 -0
- aiq/observability/utils/__init__.py +14 -0
- aiq/observability/utils/dict_utils.py +236 -0
- aiq/observability/utils/time_utils.py +31 -0
- aiq/plugins/.namespace +1 -0
- aiq/profiler/__init__.py +0 -0
- aiq/profiler/calc/__init__.py +14 -0
- aiq/profiler/calc/calc_runner.py +627 -0
- aiq/profiler/calc/calculations.py +288 -0
- aiq/profiler/calc/data_models.py +188 -0
- aiq/profiler/calc/plot.py +345 -0
- aiq/profiler/callbacks/__init__.py +0 -0
- aiq/profiler/callbacks/agno_callback_handler.py +295 -0
- aiq/profiler/callbacks/base_callback_class.py +20 -0
- aiq/profiler/callbacks/langchain_callback_handler.py +290 -0
- aiq/profiler/callbacks/llama_index_callback_handler.py +205 -0
- aiq/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
- aiq/profiler/callbacks/token_usage_base_model.py +27 -0
- aiq/profiler/data_frame_row.py +51 -0
- aiq/profiler/data_models.py +24 -0
- aiq/profiler/decorators/__init__.py +0 -0
- aiq/profiler/decorators/framework_wrapper.py +131 -0
- aiq/profiler/decorators/function_tracking.py +254 -0
- aiq/profiler/forecasting/__init__.py +0 -0
- aiq/profiler/forecasting/config.py +18 -0
- aiq/profiler/forecasting/model_trainer.py +75 -0
- aiq/profiler/forecasting/models/__init__.py +22 -0
- aiq/profiler/forecasting/models/forecasting_base_model.py +40 -0
- aiq/profiler/forecasting/models/linear_model.py +196 -0
- aiq/profiler/forecasting/models/random_forest_regressor.py +268 -0
- aiq/profiler/inference_metrics_model.py +28 -0
- aiq/profiler/inference_optimization/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +460 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
- aiq/profiler/inference_optimization/data_models.py +386 -0
- aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
- aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
- aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
- aiq/profiler/inference_optimization/llm_metrics.py +212 -0
- aiq/profiler/inference_optimization/prompt_caching.py +163 -0
- aiq/profiler/inference_optimization/token_uniqueness.py +107 -0
- aiq/profiler/inference_optimization/workflow_runtimes.py +72 -0
- aiq/profiler/intermediate_property_adapter.py +102 -0
- aiq/profiler/profile_runner.py +473 -0
- aiq/profiler/utils.py +184 -0
- aiq/registry_handlers/__init__.py +0 -0
- aiq/registry_handlers/local/__init__.py +0 -0
- aiq/registry_handlers/local/local_handler.py +176 -0
- aiq/registry_handlers/local/register_local.py +37 -0
- aiq/registry_handlers/metadata_factory.py +60 -0
- aiq/registry_handlers/package_utils.py +567 -0
- aiq/registry_handlers/pypi/__init__.py +0 -0
- aiq/registry_handlers/pypi/pypi_handler.py +251 -0
- aiq/registry_handlers/pypi/register_pypi.py +40 -0
- aiq/registry_handlers/register.py +21 -0
- aiq/registry_handlers/registry_handler_base.py +157 -0
- aiq/registry_handlers/rest/__init__.py +0 -0
- aiq/registry_handlers/rest/register_rest.py +56 -0
- aiq/registry_handlers/rest/rest_handler.py +237 -0
- aiq/registry_handlers/schemas/__init__.py +0 -0
- aiq/registry_handlers/schemas/headers.py +42 -0
- aiq/registry_handlers/schemas/package.py +68 -0
- aiq/registry_handlers/schemas/publish.py +63 -0
- aiq/registry_handlers/schemas/pull.py +82 -0
- aiq/registry_handlers/schemas/remove.py +36 -0
- aiq/registry_handlers/schemas/search.py +91 -0
- aiq/registry_handlers/schemas/status.py +47 -0
- aiq/retriever/__init__.py +0 -0
- aiq/retriever/interface.py +37 -0
- aiq/retriever/milvus/__init__.py +14 -0
- aiq/retriever/milvus/register.py +81 -0
- aiq/retriever/milvus/retriever.py +228 -0
- aiq/retriever/models.py +74 -0
- aiq/retriever/nemo_retriever/__init__.py +14 -0
- aiq/retriever/nemo_retriever/register.py +60 -0
- aiq/retriever/nemo_retriever/retriever.py +190 -0
- aiq/retriever/register.py +22 -0
- aiq/runtime/__init__.py +14 -0
- aiq/runtime/loader.py +215 -0
- aiq/runtime/runner.py +190 -0
- aiq/runtime/session.py +158 -0
- aiq/runtime/user_metadata.py +130 -0
- aiq/settings/__init__.py +0 -0
- aiq/settings/global_settings.py +318 -0
- aiq/test/.namespace +1 -0
- aiq/tool/__init__.py +0 -0
- aiq/tool/chat_completion.py +74 -0
- aiq/tool/code_execution/README.md +151 -0
- aiq/tool/code_execution/__init__.py +0 -0
- aiq/tool/code_execution/code_sandbox.py +267 -0
- aiq/tool/code_execution/local_sandbox/.gitignore +1 -0
- aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
- aiq/tool/code_execution/local_sandbox/__init__.py +13 -0
- aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +198 -0
- aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +6 -0
- aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +50 -0
- aiq/tool/code_execution/register.py +74 -0
- aiq/tool/code_execution/test_code_execution_sandbox.py +414 -0
- aiq/tool/code_execution/utils.py +100 -0
- aiq/tool/datetime_tools.py +42 -0
- aiq/tool/document_search.py +141 -0
- aiq/tool/github_tools/__init__.py +0 -0
- aiq/tool/github_tools/create_github_commit.py +133 -0
- aiq/tool/github_tools/create_github_issue.py +87 -0
- aiq/tool/github_tools/create_github_pr.py +106 -0
- aiq/tool/github_tools/get_github_file.py +106 -0
- aiq/tool/github_tools/get_github_issue.py +166 -0
- aiq/tool/github_tools/get_github_pr.py +256 -0
- aiq/tool/github_tools/update_github_issue.py +100 -0
- aiq/tool/mcp/__init__.py +14 -0
- aiq/tool/mcp/exceptions.py +142 -0
- aiq/tool/mcp/mcp_client.py +255 -0
- aiq/tool/mcp/mcp_tool.py +96 -0
- aiq/tool/memory_tools/__init__.py +0 -0
- aiq/tool/memory_tools/add_memory_tool.py +79 -0
- aiq/tool/memory_tools/delete_memory_tool.py +67 -0
- aiq/tool/memory_tools/get_memory_tool.py +72 -0
- aiq/tool/nvidia_rag.py +95 -0
- aiq/tool/register.py +38 -0
- aiq/tool/retriever.py +89 -0
- aiq/tool/server_tools.py +66 -0
- aiq/utils/__init__.py +0 -0
- aiq/utils/data_models/__init__.py +0 -0
- aiq/utils/data_models/schema_validator.py +58 -0
- aiq/utils/debugging_utils.py +43 -0
- aiq/utils/dump_distro_mapping.py +32 -0
- aiq/utils/exception_handlers/__init__.py +0 -0
- aiq/utils/exception_handlers/automatic_retries.py +289 -0
- aiq/utils/exception_handlers/mcp.py +211 -0
- aiq/utils/exception_handlers/schemas.py +114 -0
- aiq/utils/io/__init__.py +0 -0
- aiq/utils/io/model_processing.py +28 -0
- aiq/utils/io/yaml_tools.py +119 -0
- aiq/utils/log_utils.py +37 -0
- aiq/utils/metadata_utils.py +74 -0
- aiq/utils/optional_imports.py +142 -0
- aiq/utils/producer_consumer_queue.py +178 -0
- aiq/utils/reactive/__init__.py +0 -0
- aiq/utils/reactive/base/__init__.py +0 -0
- aiq/utils/reactive/base/observable_base.py +65 -0
- aiq/utils/reactive/base/observer_base.py +55 -0
- aiq/utils/reactive/base/subject_base.py +79 -0
- aiq/utils/reactive/observable.py +59 -0
- aiq/utils/reactive/observer.py +76 -0
- aiq/utils/reactive/subject.py +131 -0
- aiq/utils/reactive/subscription.py +49 -0
- aiq/utils/settings/__init__.py +0 -0
- aiq/utils/settings/global_settings.py +197 -0
- aiq/utils/string_utils.py +38 -0
- aiq/utils/type_converter.py +290 -0
- aiq/utils/type_utils.py +484 -0
- aiq/utils/url_utils.py +27 -0
- nvidia_nat-1.2.0rc5.dist-info/METADATA +363 -0
- nvidia_nat-1.2.0rc5.dist-info/RECORD +435 -0
- nvidia_nat-1.2.0rc5.dist-info/WHEEL +5 -0
- nvidia_nat-1.2.0rc5.dist-info/entry_points.txt +20 -0
- nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE-3rd-party.txt +3686 -0
- nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE.md +201 -0
- nvidia_nat-1.2.0rc5.dist-info/top_level.txt +1 -0
|
@@ -0,0 +1,44 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import typing
|
|
17
|
+
|
|
18
|
+
from .common import BaseModelRegistryTag
|
|
19
|
+
from .common import TypedBaseModel
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
class ObjectStoreBaseConfig(TypedBaseModel, BaseModelRegistryTag):
|
|
23
|
+
pass
|
|
24
|
+
|
|
25
|
+
|
|
26
|
+
ObjectStoreBaseConfigT = typing.TypeVar("ObjectStoreBaseConfigT", bound=ObjectStoreBaseConfig)
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
class KeyAlreadyExistsError(Exception):
|
|
30
|
+
|
|
31
|
+
def __init__(self, key: str, additional_message: str | None = None):
|
|
32
|
+
parts = [f"Key already exists: {key}."]
|
|
33
|
+
if additional_message:
|
|
34
|
+
parts.append(additional_message)
|
|
35
|
+
super().__init__(" ".join(parts))
|
|
36
|
+
|
|
37
|
+
|
|
38
|
+
class NoSuchKeyError(Exception):
|
|
39
|
+
|
|
40
|
+
def __init__(self, key: str, additional_message: str | None = None):
|
|
41
|
+
parts = [f"No object found with key: {key}."]
|
|
42
|
+
if additional_message:
|
|
43
|
+
parts.append(additional_message)
|
|
44
|
+
super().__init__(" ".join(parts))
|
|
@@ -0,0 +1,54 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from pydantic import BaseModel
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
class PromptCachingConfig(BaseModel):
|
|
20
|
+
enable: bool = False
|
|
21
|
+
min_frequency: float = 0.5
|
|
22
|
+
|
|
23
|
+
|
|
24
|
+
class BottleneckConfig(BaseModel):
|
|
25
|
+
enable_simple_stack: bool = False
|
|
26
|
+
enable_nested_stack: bool = False
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
class ConcurrencySpikeConfig(BaseModel):
|
|
30
|
+
enable: bool = False
|
|
31
|
+
spike_threshold: int = 1
|
|
32
|
+
|
|
33
|
+
|
|
34
|
+
class PrefixSpanConfig(BaseModel):
|
|
35
|
+
enable: bool = False
|
|
36
|
+
min_support: float = 2
|
|
37
|
+
min_coverage: float = 0
|
|
38
|
+
max_text_len: int = 1000
|
|
39
|
+
top_k: int = 10
|
|
40
|
+
chain_with_common_prefixes: bool = False
|
|
41
|
+
|
|
42
|
+
|
|
43
|
+
class ProfilerConfig(BaseModel):
|
|
44
|
+
|
|
45
|
+
base_metrics: bool = False
|
|
46
|
+
token_usage_forecast: bool = False
|
|
47
|
+
token_uniqueness_forecast: bool = False
|
|
48
|
+
workflow_runtime_forecast: bool = False
|
|
49
|
+
compute_llm_metrics: bool = False
|
|
50
|
+
csv_exclude_io_text: bool = False
|
|
51
|
+
prompt_caching_prefixes: PromptCachingConfig = PromptCachingConfig()
|
|
52
|
+
bottleneck_analysis: BottleneckConfig = BottleneckConfig()
|
|
53
|
+
concurrency_spike_analysis: ConcurrencySpikeConfig = ConcurrencySpikeConfig()
|
|
54
|
+
prefix_span_analysis: PrefixSpanConfig = PrefixSpanConfig()
|
|
@@ -0,0 +1,26 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import typing
|
|
17
|
+
|
|
18
|
+
from .common import BaseModelRegistryTag
|
|
19
|
+
from .common import TypedBaseModel
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
class RegistryHandlerBaseConfig(TypedBaseModel, BaseModelRegistryTag):
|
|
23
|
+
pass
|
|
24
|
+
|
|
25
|
+
|
|
26
|
+
RegistryHandlerBaseConfigT = typing.TypeVar("RegistryHandlerBaseConfigT", bound=RegistryHandlerBaseConfig)
|
|
@@ -0,0 +1,30 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import typing
|
|
17
|
+
|
|
18
|
+
from aiq.data_models.common import BaseModelRegistryTag
|
|
19
|
+
from aiq.data_models.common import TypedBaseModel
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
class RetrieverBaseConfig(TypedBaseModel, BaseModelRegistryTag):
|
|
23
|
+
"""
|
|
24
|
+
The base level config object for a retriever object. Retrievers use different provider clients (e.g., Milvus) to
|
|
25
|
+
provide an interface for searching for and retrieving documents from the configured data store.
|
|
26
|
+
"""
|
|
27
|
+
pass
|
|
28
|
+
|
|
29
|
+
|
|
30
|
+
RetrieverBaseConfigT = typing.TypeVar("RetrieverBaseConfigT", bound=RetrieverBaseConfig)
|
|
@@ -0,0 +1,35 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from pydantic import BaseModel
|
|
17
|
+
from pydantic import Field
|
|
18
|
+
|
|
19
|
+
|
|
20
|
+
class RetryMixin(BaseModel):
|
|
21
|
+
"""Mixin class for retry configuration."""
|
|
22
|
+
do_auto_retry: bool = Field(default=True,
|
|
23
|
+
description="Whether to automatically retry method calls"
|
|
24
|
+
" that fail with a retryable error.",
|
|
25
|
+
exclude=True)
|
|
26
|
+
num_retries: int = Field(default=5,
|
|
27
|
+
description="Number of times to retry a method call that fails"
|
|
28
|
+
" with a retryable error.",
|
|
29
|
+
exclude=True)
|
|
30
|
+
retry_on_status_codes: list[int | str] = Field(default_factory=lambda: [429, 500, 502, 503, 504],
|
|
31
|
+
description="List of HTTP status codes that should trigger a retry.",
|
|
32
|
+
exclude=True)
|
|
33
|
+
retry_on_errors: list[str] | None = Field(default_factory=lambda: ["Too Many Requests"],
|
|
34
|
+
description="List of error substrings that should trigger a retry.",
|
|
35
|
+
exclude=True)
|
aiq/data_models/span.py
ADDED
|
@@ -0,0 +1,187 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
import time
|
|
18
|
+
import uuid
|
|
19
|
+
from enum import Enum
|
|
20
|
+
from typing import Any
|
|
21
|
+
|
|
22
|
+
from pydantic import BaseModel
|
|
23
|
+
from pydantic import Field
|
|
24
|
+
from pydantic import field_validator
|
|
25
|
+
|
|
26
|
+
logger = logging.getLogger(__name__)
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
class SpanKind(Enum):
|
|
30
|
+
LLM = "LLM"
|
|
31
|
+
TOOL = "TOOL"
|
|
32
|
+
WORKFLOW = "WORKFLOW"
|
|
33
|
+
TASK = "TASK"
|
|
34
|
+
FUNCTION = "FUNCTION"
|
|
35
|
+
CUSTOM = "CUSTOM"
|
|
36
|
+
SPAN = "SPAN"
|
|
37
|
+
EMBEDDER = "EMBEDDER"
|
|
38
|
+
RETRIEVER = "RETRIEVER"
|
|
39
|
+
AGENT = "AGENT"
|
|
40
|
+
RERANKER = "RERANKER"
|
|
41
|
+
GUARDRAIL = "GUARDRAIL"
|
|
42
|
+
EVALUATOR = "EVALUATOR"
|
|
43
|
+
UNKNOWN = "UNKNOWN"
|
|
44
|
+
|
|
45
|
+
|
|
46
|
+
EVENT_TYPE_TO_SPAN_KIND_MAP = {
|
|
47
|
+
"LLM_START": SpanKind.LLM,
|
|
48
|
+
"LLM_END": SpanKind.LLM,
|
|
49
|
+
"LLM_NEW_TOKEN": SpanKind.LLM,
|
|
50
|
+
"TOOL_START": SpanKind.TOOL,
|
|
51
|
+
"TOOL_END": SpanKind.TOOL,
|
|
52
|
+
"WORKFLOW_START": SpanKind.WORKFLOW,
|
|
53
|
+
"WORKFLOW_END": SpanKind.WORKFLOW,
|
|
54
|
+
"TASK_START": SpanKind.TASK,
|
|
55
|
+
"TASK_END": SpanKind.TASK,
|
|
56
|
+
"FUNCTION_START": SpanKind.FUNCTION,
|
|
57
|
+
"FUNCTION_END": SpanKind.FUNCTION,
|
|
58
|
+
"CUSTOM_START": SpanKind.CUSTOM,
|
|
59
|
+
"CUSTOM_END": SpanKind.CUSTOM,
|
|
60
|
+
"SPAN_START": SpanKind.SPAN,
|
|
61
|
+
"SPAN_END": SpanKind.SPAN,
|
|
62
|
+
"EMBEDDER_START": SpanKind.EMBEDDER,
|
|
63
|
+
"EMBEDDER_END": SpanKind.EMBEDDER,
|
|
64
|
+
"RETRIEVER_START": SpanKind.RETRIEVER,
|
|
65
|
+
"RETRIEVER_END": SpanKind.RETRIEVER,
|
|
66
|
+
"AGENT_START": SpanKind.AGENT,
|
|
67
|
+
"AGENT_END": SpanKind.AGENT,
|
|
68
|
+
"RERANKER_START": SpanKind.RERANKER,
|
|
69
|
+
"RERANKER_END": SpanKind.RERANKER,
|
|
70
|
+
"GUARDRAIL_START": SpanKind.GUARDRAIL,
|
|
71
|
+
"GUARDRAIL_END": SpanKind.GUARDRAIL,
|
|
72
|
+
"EVALUATOR_START": SpanKind.EVALUATOR,
|
|
73
|
+
"EVALUATOR_END": SpanKind.EVALUATOR,
|
|
74
|
+
}
|
|
75
|
+
|
|
76
|
+
|
|
77
|
+
def event_type_to_span_kind(event_type: str) -> SpanKind:
|
|
78
|
+
"""Convert an event type to a span kind.
|
|
79
|
+
|
|
80
|
+
Args:
|
|
81
|
+
event_type (str): The event type to convert.
|
|
82
|
+
|
|
83
|
+
Returns:
|
|
84
|
+
SpanKind: The span kind.
|
|
85
|
+
"""
|
|
86
|
+
return EVENT_TYPE_TO_SPAN_KIND_MAP.get(event_type, SpanKind.UNKNOWN)
|
|
87
|
+
|
|
88
|
+
|
|
89
|
+
class SpanAttributes(Enum):
|
|
90
|
+
AIQ_SPAN_KIND = "aiq.span.kind"
|
|
91
|
+
INPUT_VALUE = "input.value"
|
|
92
|
+
INPUT_MIME_TYPE = "input.mime_type"
|
|
93
|
+
LLM_TOKEN_COUNT_PROMPT = "llm.token_count.prompt"
|
|
94
|
+
LLM_TOKEN_COUNT_COMPLETION = "llm.token_count.completion"
|
|
95
|
+
LLM_TOKEN_COUNT_TOTAL = "llm.token_count.total"
|
|
96
|
+
OUTPUT_VALUE = "output.value"
|
|
97
|
+
OUTPUT_MIME_TYPE = "output.mime_type"
|
|
98
|
+
AIQ_USAGE_NUM_LLM_CALLS = "aiq.usage.num_llm_calls"
|
|
99
|
+
AIQ_USAGE_SECONDS_BETWEEN_CALLS = "aiq.usage.seconds_between_calls"
|
|
100
|
+
AIQ_USAGE_TOKEN_COUNT_PROMPT = "aiq.usage.token_count.prompt"
|
|
101
|
+
AIQ_USAGE_TOKEN_COUNT_COMPLETION = "aiq.usage.token_count.completion"
|
|
102
|
+
AIQ_USAGE_TOKEN_COUNT_TOTAL = "aiq.usage.token_count.total"
|
|
103
|
+
AIQ_EVENT_TYPE = "aiq.event_type"
|
|
104
|
+
|
|
105
|
+
|
|
106
|
+
class MimeTypes(Enum):
|
|
107
|
+
TEXT = "text/plain"
|
|
108
|
+
JSON = "application/json"
|
|
109
|
+
|
|
110
|
+
|
|
111
|
+
class SpanStatusCode(Enum):
|
|
112
|
+
OK = "OK"
|
|
113
|
+
ERROR = "ERROR"
|
|
114
|
+
UNSET = "UNSET"
|
|
115
|
+
|
|
116
|
+
|
|
117
|
+
class SpanEvent(BaseModel):
|
|
118
|
+
timestamp: float = Field(default_factory=lambda: int(time.time() * 1e9), description="The timestamp of the event.")
|
|
119
|
+
name: str = Field(description="The name of the event.")
|
|
120
|
+
attributes: dict[str, Any] = Field(default_factory=dict, description="The attributes of the event.")
|
|
121
|
+
|
|
122
|
+
|
|
123
|
+
class SpanStatus(BaseModel):
|
|
124
|
+
code: SpanStatusCode = Field(default=SpanStatusCode.OK, description="The status code of the span.")
|
|
125
|
+
message: str | None = Field(default=None, description="The status message of the span.")
|
|
126
|
+
|
|
127
|
+
|
|
128
|
+
class SpanContext(BaseModel):
|
|
129
|
+
trace_id: int = Field(default_factory=lambda: uuid.uuid4().int, description="The 128-bit trace ID of the span.")
|
|
130
|
+
span_id: int = Field(default_factory=lambda: uuid.uuid4().int & ((1 << 64) - 1),
|
|
131
|
+
description="The 64-bit span ID of the span.")
|
|
132
|
+
|
|
133
|
+
|
|
134
|
+
class Span(BaseModel):
|
|
135
|
+
name: str = Field(description="The name of the span.")
|
|
136
|
+
context: SpanContext | None = Field(default=None, description="The context of the span.")
|
|
137
|
+
parent: "Span | None" = Field(default=None, description="The parent span of the span.")
|
|
138
|
+
start_time: int = Field(default_factory=lambda: int(time.time() * 1e9), description="The start time of the span.")
|
|
139
|
+
end_time: int | None = Field(default=None, description="The end time of the span.")
|
|
140
|
+
attributes: dict[str, Any] = Field(default_factory=dict, description="The attributes of the span.")
|
|
141
|
+
events: list[SpanEvent] = Field(default_factory=list, description="The events of the span.")
|
|
142
|
+
status: SpanStatus = Field(default_factory=SpanStatus, description="The status of the span.")
|
|
143
|
+
|
|
144
|
+
@field_validator('context', mode='before')
|
|
145
|
+
@classmethod
|
|
146
|
+
def set_default_context(cls, v: SpanContext | None) -> SpanContext:
|
|
147
|
+
"""Set the default context if the context is not provided.
|
|
148
|
+
|
|
149
|
+
Args:
|
|
150
|
+
v (SpanContext | None): The context to set.
|
|
151
|
+
|
|
152
|
+
Returns:
|
|
153
|
+
SpanContext: The context.
|
|
154
|
+
"""
|
|
155
|
+
if v is None:
|
|
156
|
+
return SpanContext()
|
|
157
|
+
return v
|
|
158
|
+
|
|
159
|
+
def set_attribute(self, key: str, value: Any) -> None:
|
|
160
|
+
"""Set the attribute of the span.
|
|
161
|
+
|
|
162
|
+
Args:
|
|
163
|
+
key (str): The key of the attribute.
|
|
164
|
+
value (Any): The value of the attribute.
|
|
165
|
+
"""
|
|
166
|
+
self.attributes[key] = value
|
|
167
|
+
|
|
168
|
+
def add_event(self, name: str, attributes: dict[str, Any] | None = None) -> None:
|
|
169
|
+
"""Add an event to the span.
|
|
170
|
+
|
|
171
|
+
Args:
|
|
172
|
+
name (str): The name of the event.
|
|
173
|
+
attributes (dict[str, Any] | None): The attributes of the event.
|
|
174
|
+
"""
|
|
175
|
+
if attributes is None:
|
|
176
|
+
attributes = {}
|
|
177
|
+
self.events = self.events + [SpanEvent(name=name, attributes=attributes)]
|
|
178
|
+
|
|
179
|
+
def end(self, end_time: int | None = None) -> None:
|
|
180
|
+
"""End the span.
|
|
181
|
+
|
|
182
|
+
Args:
|
|
183
|
+
end_time (int | None): The end time of the span.
|
|
184
|
+
"""
|
|
185
|
+
if end_time is None:
|
|
186
|
+
end_time = int(time.time() * 1e9)
|
|
187
|
+
self.end_time = end_time
|
|
@@ -0,0 +1,64 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
from enum import Enum
|
|
18
|
+
|
|
19
|
+
from pydantic import BaseModel
|
|
20
|
+
from pydantic import Field
|
|
21
|
+
from pydantic import model_validator
|
|
22
|
+
|
|
23
|
+
from aiq.data_models.intermediate_step import IntermediateStepType
|
|
24
|
+
|
|
25
|
+
logger = logging.getLogger(__name__)
|
|
26
|
+
|
|
27
|
+
|
|
28
|
+
class StepAdaptorMode(str, Enum):
|
|
29
|
+
DEFAULT = "default"
|
|
30
|
+
CUSTOM = "custom"
|
|
31
|
+
OFF = "off"
|
|
32
|
+
|
|
33
|
+
|
|
34
|
+
class StepAdaptorConfig(BaseModel):
|
|
35
|
+
"""
|
|
36
|
+
Configures how intermediate steps are filtered and normalized by the StepAdaptor.
|
|
37
|
+
|
|
38
|
+
Args:
|
|
39
|
+
mode (StepAdaptorMode): One of:
|
|
40
|
+
- 'current' => pass only LLM (all LLM_* events) + TOOL_END
|
|
41
|
+
- 'end_events_only' => pass only LLM_END and TOOL_END
|
|
42
|
+
- 'custom' => pass only the events in custom_event_types
|
|
43
|
+
custom_event_types (list[IntermediateStepType]):
|
|
44
|
+
If mode == 'custom', we only pass events whose event_type is in this list.
|
|
45
|
+
Otherwise, this field is ignored.
|
|
46
|
+
"""
|
|
47
|
+
mode: StepAdaptorMode = StepAdaptorMode.DEFAULT
|
|
48
|
+
custom_event_types: list[IntermediateStepType] = Field(default_factory=list)
|
|
49
|
+
|
|
50
|
+
@model_validator(mode="after")
|
|
51
|
+
def check_custom_event_types(self) -> "StepAdaptorConfig":
|
|
52
|
+
"""
|
|
53
|
+
Validates custom configurations
|
|
54
|
+
"""
|
|
55
|
+
if self.mode != StepAdaptorMode.CUSTOM and self.custom_event_types:
|
|
56
|
+
logger.warning("Ignoring custom_event_types because mode is not 'custom'")
|
|
57
|
+
self.custom_event_types = []
|
|
58
|
+
elif self.mode == StepAdaptorMode.CUSTOM and not self.custom_event_types:
|
|
59
|
+
logger.warning("No custom_event_types provided for custom mode. Defaulting to CUSTOM_START and CUSTOM_END")
|
|
60
|
+
self.custom_event_types = [IntermediateStepType.CUSTOM_START, IntermediateStepType.CUSTOM_END]
|
|
61
|
+
elif self.mode == StepAdaptorMode.OFF:
|
|
62
|
+
logger.warning("StepAdaptor is disabled. Ignoring all intermediate event types")
|
|
63
|
+
self.custom_event_types = []
|
|
64
|
+
return self
|
|
@@ -0,0 +1,33 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import inspect
|
|
17
|
+
import typing
|
|
18
|
+
from collections.abc import Callable
|
|
19
|
+
|
|
20
|
+
_T = typing.TypeVar("_T")
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
class Streaming(typing.Generic[_T]):
|
|
24
|
+
|
|
25
|
+
def __init__(self, *, convert: Callable[[typing.Any], _T] = None):
|
|
26
|
+
self.convert = convert
|
|
27
|
+
|
|
28
|
+
sig = inspect.signature(self.convert)
|
|
29
|
+
|
|
30
|
+
if (sig.return_annotation == inspect.Parameter.empty):
|
|
31
|
+
raise ValueError("convert must have a return annotation")
|
|
32
|
+
|
|
33
|
+
self.single_output_type = sig.return_annotation
|
|
@@ -0,0 +1,54 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import json
|
|
17
|
+
|
|
18
|
+
from pydantic import BaseModel
|
|
19
|
+
from pydantic import ConfigDict
|
|
20
|
+
from pydantic import field_validator
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
class SWEBenchInput(BaseModel):
|
|
24
|
+
# Allow extra fields in the model_config to support derived models
|
|
25
|
+
model_config = ConfigDict(extra="allow")
|
|
26
|
+
|
|
27
|
+
repo: str
|
|
28
|
+
instance_id: str
|
|
29
|
+
base_commit: str
|
|
30
|
+
patch: str
|
|
31
|
+
test_patch: str
|
|
32
|
+
problem_statement: str
|
|
33
|
+
hints_text: str
|
|
34
|
+
created_at: str | int
|
|
35
|
+
version: float
|
|
36
|
+
FAIL_TO_PASS: list[str]
|
|
37
|
+
PASS_TO_PASS: list[str]
|
|
38
|
+
environment_setup_commit: str
|
|
39
|
+
|
|
40
|
+
# Handle improperly formatted JSON strings for list fields
|
|
41
|
+
@field_validator("FAIL_TO_PASS", "PASS_TO_PASS", mode="before")
|
|
42
|
+
def parse_list_fields(cls, value): # pylint: disable=no-self-argument
|
|
43
|
+
if isinstance(value, str):
|
|
44
|
+
# Attempt to parse the string as a list
|
|
45
|
+
return json.loads(value)
|
|
46
|
+
return value
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
class SWEBenchOutput(BaseModel):
|
|
50
|
+
model_config = ConfigDict(protected_namespaces=(), populate_by_name=True)
|
|
51
|
+
|
|
52
|
+
instance_id: str
|
|
53
|
+
model_name_or_path: str
|
|
54
|
+
model_patch: str
|
|
@@ -0,0 +1,26 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import typing
|
|
17
|
+
|
|
18
|
+
from aiq.data_models.common import BaseModelRegistryTag
|
|
19
|
+
from aiq.data_models.common import TypedBaseModel
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
class TelemetryExporterBaseConfig(TypedBaseModel, BaseModelRegistryTag):
|
|
23
|
+
pass
|
|
24
|
+
|
|
25
|
+
|
|
26
|
+
TelemetryExporterConfigT = typing.TypeVar("TelemetryExporterConfigT", bound=TelemetryExporterBaseConfig)
|
|
@@ -0,0 +1,30 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import typing
|
|
17
|
+
|
|
18
|
+
from .common import BaseModelRegistryTag
|
|
19
|
+
from .common import TypedBaseModel
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
class TTCStrategyBaseConfig(TypedBaseModel, BaseModelRegistryTag):
|
|
23
|
+
"""
|
|
24
|
+
Base configuration class for Test Time Compute (TTC) strategy.
|
|
25
|
+
This class is used to define the structure of TTC strategy configurations.
|
|
26
|
+
"""
|
|
27
|
+
pass
|
|
28
|
+
|
|
29
|
+
|
|
30
|
+
TTCStrategyBaseConfigT = typing.TypeVar("TTCStrategyBaseConfigT", bound=TTCStrategyBaseConfig)
|
aiq/embedder/__init__.py
ADDED
|
File without changes
|
|
@@ -0,0 +1,41 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from aiq.builder.builder import Builder
|
|
17
|
+
from aiq.builder.framework_enum import LLMFrameworkEnum
|
|
18
|
+
from aiq.cli.register_workflow import register_embedder_client
|
|
19
|
+
from aiq.embedder.nim_embedder import NIMEmbedderModelConfig
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
@register_embedder_client(config_type=NIMEmbedderModelConfig, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
|
|
23
|
+
async def nim_langchain(embedder_config: NIMEmbedderModelConfig, builder: Builder):
|
|
24
|
+
|
|
25
|
+
from langchain_nvidia_ai_endpoints import NVIDIAEmbeddings
|
|
26
|
+
|
|
27
|
+
yield NVIDIAEmbeddings(**embedder_config.model_dump(exclude={"type"}, by_alias=True))
|
|
28
|
+
|
|
29
|
+
|
|
30
|
+
@register_embedder_client(config_type=NIMEmbedderModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
|
|
31
|
+
async def nim_llamaindex(embedder_config: NIMEmbedderModelConfig, builder: Builder):
|
|
32
|
+
|
|
33
|
+
from llama_index.embeddings.nvidia import NVIDIAEmbedding # pylint: disable=no-name-in-module
|
|
34
|
+
|
|
35
|
+
config_obj = {
|
|
36
|
+
**embedder_config.model_dump(exclude={"type", "model_name"}, by_alias=True),
|
|
37
|
+
"model":
|
|
38
|
+
embedder_config.model_name,
|
|
39
|
+
}
|
|
40
|
+
|
|
41
|
+
yield NVIDIAEmbedding(**config_obj)
|