nvidia-nat 1.2.0rc5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- aiq/agent/__init__.py +0 -0
- aiq/agent/base.py +239 -0
- aiq/agent/dual_node.py +67 -0
- aiq/agent/react_agent/__init__.py +0 -0
- aiq/agent/react_agent/agent.py +355 -0
- aiq/agent/react_agent/output_parser.py +104 -0
- aiq/agent/react_agent/prompt.py +41 -0
- aiq/agent/react_agent/register.py +149 -0
- aiq/agent/reasoning_agent/__init__.py +0 -0
- aiq/agent/reasoning_agent/reasoning_agent.py +225 -0
- aiq/agent/register.py +23 -0
- aiq/agent/rewoo_agent/__init__.py +0 -0
- aiq/agent/rewoo_agent/agent.py +411 -0
- aiq/agent/rewoo_agent/prompt.py +108 -0
- aiq/agent/rewoo_agent/register.py +158 -0
- aiq/agent/tool_calling_agent/__init__.py +0 -0
- aiq/agent/tool_calling_agent/agent.py +119 -0
- aiq/agent/tool_calling_agent/register.py +106 -0
- aiq/authentication/__init__.py +14 -0
- aiq/authentication/api_key/__init__.py +14 -0
- aiq/authentication/api_key/api_key_auth_provider.py +96 -0
- aiq/authentication/api_key/api_key_auth_provider_config.py +124 -0
- aiq/authentication/api_key/register.py +26 -0
- aiq/authentication/exceptions/__init__.py +14 -0
- aiq/authentication/exceptions/api_key_exceptions.py +38 -0
- aiq/authentication/http_basic_auth/__init__.py +0 -0
- aiq/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
- aiq/authentication/http_basic_auth/register.py +30 -0
- aiq/authentication/interfaces.py +93 -0
- aiq/authentication/oauth2/__init__.py +14 -0
- aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +107 -0
- aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
- aiq/authentication/oauth2/register.py +25 -0
- aiq/authentication/register.py +21 -0
- aiq/builder/__init__.py +0 -0
- aiq/builder/builder.py +285 -0
- aiq/builder/component_utils.py +316 -0
- aiq/builder/context.py +264 -0
- aiq/builder/embedder.py +24 -0
- aiq/builder/eval_builder.py +161 -0
- aiq/builder/evaluator.py +29 -0
- aiq/builder/framework_enum.py +24 -0
- aiq/builder/front_end.py +73 -0
- aiq/builder/function.py +344 -0
- aiq/builder/function_base.py +380 -0
- aiq/builder/function_info.py +627 -0
- aiq/builder/intermediate_step_manager.py +174 -0
- aiq/builder/llm.py +25 -0
- aiq/builder/retriever.py +25 -0
- aiq/builder/user_interaction_manager.py +74 -0
- aiq/builder/workflow.py +148 -0
- aiq/builder/workflow_builder.py +1117 -0
- aiq/cli/__init__.py +14 -0
- aiq/cli/cli_utils/__init__.py +0 -0
- aiq/cli/cli_utils/config_override.py +231 -0
- aiq/cli/cli_utils/validation.py +37 -0
- aiq/cli/commands/__init__.py +0 -0
- aiq/cli/commands/configure/__init__.py +0 -0
- aiq/cli/commands/configure/channel/__init__.py +0 -0
- aiq/cli/commands/configure/channel/add.py +28 -0
- aiq/cli/commands/configure/channel/channel.py +36 -0
- aiq/cli/commands/configure/channel/remove.py +30 -0
- aiq/cli/commands/configure/channel/update.py +30 -0
- aiq/cli/commands/configure/configure.py +33 -0
- aiq/cli/commands/evaluate.py +139 -0
- aiq/cli/commands/info/__init__.py +14 -0
- aiq/cli/commands/info/info.py +39 -0
- aiq/cli/commands/info/list_channels.py +32 -0
- aiq/cli/commands/info/list_components.py +129 -0
- aiq/cli/commands/info/list_mcp.py +213 -0
- aiq/cli/commands/registry/__init__.py +14 -0
- aiq/cli/commands/registry/publish.py +88 -0
- aiq/cli/commands/registry/pull.py +118 -0
- aiq/cli/commands/registry/registry.py +38 -0
- aiq/cli/commands/registry/remove.py +108 -0
- aiq/cli/commands/registry/search.py +155 -0
- aiq/cli/commands/sizing/__init__.py +14 -0
- aiq/cli/commands/sizing/calc.py +297 -0
- aiq/cli/commands/sizing/sizing.py +27 -0
- aiq/cli/commands/start.py +246 -0
- aiq/cli/commands/uninstall.py +81 -0
- aiq/cli/commands/validate.py +47 -0
- aiq/cli/commands/workflow/__init__.py +14 -0
- aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
- aiq/cli/commands/workflow/templates/config.yml.j2 +16 -0
- aiq/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
- aiq/cli/commands/workflow/templates/register.py.j2 +5 -0
- aiq/cli/commands/workflow/templates/workflow.py.j2 +36 -0
- aiq/cli/commands/workflow/workflow.py +37 -0
- aiq/cli/commands/workflow/workflow_commands.py +313 -0
- aiq/cli/entrypoint.py +135 -0
- aiq/cli/main.py +44 -0
- aiq/cli/register_workflow.py +488 -0
- aiq/cli/type_registry.py +1000 -0
- aiq/data_models/__init__.py +14 -0
- aiq/data_models/api_server.py +694 -0
- aiq/data_models/authentication.py +231 -0
- aiq/data_models/common.py +171 -0
- aiq/data_models/component.py +54 -0
- aiq/data_models/component_ref.py +168 -0
- aiq/data_models/config.py +406 -0
- aiq/data_models/dataset_handler.py +123 -0
- aiq/data_models/discovery_metadata.py +335 -0
- aiq/data_models/embedder.py +27 -0
- aiq/data_models/evaluate.py +127 -0
- aiq/data_models/evaluator.py +26 -0
- aiq/data_models/front_end.py +26 -0
- aiq/data_models/function.py +30 -0
- aiq/data_models/function_dependencies.py +72 -0
- aiq/data_models/interactive.py +246 -0
- aiq/data_models/intermediate_step.py +302 -0
- aiq/data_models/invocation_node.py +38 -0
- aiq/data_models/llm.py +27 -0
- aiq/data_models/logging.py +26 -0
- aiq/data_models/memory.py +27 -0
- aiq/data_models/object_store.py +44 -0
- aiq/data_models/profiler.py +54 -0
- aiq/data_models/registry_handler.py +26 -0
- aiq/data_models/retriever.py +30 -0
- aiq/data_models/retry_mixin.py +35 -0
- aiq/data_models/span.py +187 -0
- aiq/data_models/step_adaptor.py +64 -0
- aiq/data_models/streaming.py +33 -0
- aiq/data_models/swe_bench_model.py +54 -0
- aiq/data_models/telemetry_exporter.py +26 -0
- aiq/data_models/ttc_strategy.py +30 -0
- aiq/embedder/__init__.py +0 -0
- aiq/embedder/langchain_client.py +41 -0
- aiq/embedder/nim_embedder.py +59 -0
- aiq/embedder/openai_embedder.py +43 -0
- aiq/embedder/register.py +24 -0
- aiq/eval/__init__.py +14 -0
- aiq/eval/config.py +60 -0
- aiq/eval/dataset_handler/__init__.py +0 -0
- aiq/eval/dataset_handler/dataset_downloader.py +106 -0
- aiq/eval/dataset_handler/dataset_filter.py +52 -0
- aiq/eval/dataset_handler/dataset_handler.py +254 -0
- aiq/eval/evaluate.py +506 -0
- aiq/eval/evaluator/__init__.py +14 -0
- aiq/eval/evaluator/base_evaluator.py +73 -0
- aiq/eval/evaluator/evaluator_model.py +45 -0
- aiq/eval/intermediate_step_adapter.py +99 -0
- aiq/eval/rag_evaluator/__init__.py +0 -0
- aiq/eval/rag_evaluator/evaluate.py +178 -0
- aiq/eval/rag_evaluator/register.py +143 -0
- aiq/eval/register.py +23 -0
- aiq/eval/remote_workflow.py +133 -0
- aiq/eval/runners/__init__.py +14 -0
- aiq/eval/runners/config.py +39 -0
- aiq/eval/runners/multi_eval_runner.py +54 -0
- aiq/eval/runtime_event_subscriber.py +52 -0
- aiq/eval/swe_bench_evaluator/__init__.py +0 -0
- aiq/eval/swe_bench_evaluator/evaluate.py +215 -0
- aiq/eval/swe_bench_evaluator/register.py +36 -0
- aiq/eval/trajectory_evaluator/__init__.py +0 -0
- aiq/eval/trajectory_evaluator/evaluate.py +75 -0
- aiq/eval/trajectory_evaluator/register.py +40 -0
- aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
- aiq/eval/tunable_rag_evaluator/evaluate.py +245 -0
- aiq/eval/tunable_rag_evaluator/register.py +52 -0
- aiq/eval/usage_stats.py +41 -0
- aiq/eval/utils/__init__.py +0 -0
- aiq/eval/utils/output_uploader.py +140 -0
- aiq/eval/utils/tqdm_position_registry.py +40 -0
- aiq/eval/utils/weave_eval.py +184 -0
- aiq/experimental/__init__.py +0 -0
- aiq/experimental/decorators/__init__.py +0 -0
- aiq/experimental/decorators/experimental_warning_decorator.py +130 -0
- aiq/experimental/test_time_compute/__init__.py +0 -0
- aiq/experimental/test_time_compute/editing/__init__.py +0 -0
- aiq/experimental/test_time_compute/editing/iterative_plan_refinement_editor.py +147 -0
- aiq/experimental/test_time_compute/editing/llm_as_a_judge_editor.py +204 -0
- aiq/experimental/test_time_compute/editing/motivation_aware_summarization.py +107 -0
- aiq/experimental/test_time_compute/functions/__init__.py +0 -0
- aiq/experimental/test_time_compute/functions/execute_score_select_function.py +105 -0
- aiq/experimental/test_time_compute/functions/its_tool_orchestration_function.py +205 -0
- aiq/experimental/test_time_compute/functions/its_tool_wrapper_function.py +146 -0
- aiq/experimental/test_time_compute/functions/plan_select_execute_function.py +224 -0
- aiq/experimental/test_time_compute/models/__init__.py +0 -0
- aiq/experimental/test_time_compute/models/editor_config.py +132 -0
- aiq/experimental/test_time_compute/models/scoring_config.py +112 -0
- aiq/experimental/test_time_compute/models/search_config.py +120 -0
- aiq/experimental/test_time_compute/models/selection_config.py +154 -0
- aiq/experimental/test_time_compute/models/stage_enums.py +43 -0
- aiq/experimental/test_time_compute/models/strategy_base.py +66 -0
- aiq/experimental/test_time_compute/models/tool_use_config.py +41 -0
- aiq/experimental/test_time_compute/models/ttc_item.py +48 -0
- aiq/experimental/test_time_compute/register.py +36 -0
- aiq/experimental/test_time_compute/scoring/__init__.py +0 -0
- aiq/experimental/test_time_compute/scoring/llm_based_agent_scorer.py +168 -0
- aiq/experimental/test_time_compute/scoring/llm_based_plan_scorer.py +168 -0
- aiq/experimental/test_time_compute/scoring/motivation_aware_scorer.py +111 -0
- aiq/experimental/test_time_compute/search/__init__.py +0 -0
- aiq/experimental/test_time_compute/search/multi_llm_planner.py +128 -0
- aiq/experimental/test_time_compute/search/multi_query_retrieval_search.py +122 -0
- aiq/experimental/test_time_compute/search/single_shot_multi_plan_planner.py +128 -0
- aiq/experimental/test_time_compute/selection/__init__.py +0 -0
- aiq/experimental/test_time_compute/selection/best_of_n_selector.py +63 -0
- aiq/experimental/test_time_compute/selection/llm_based_agent_output_selector.py +131 -0
- aiq/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +159 -0
- aiq/experimental/test_time_compute/selection/llm_based_plan_selector.py +128 -0
- aiq/experimental/test_time_compute/selection/threshold_selector.py +58 -0
- aiq/front_ends/__init__.py +14 -0
- aiq/front_ends/console/__init__.py +14 -0
- aiq/front_ends/console/authentication_flow_handler.py +233 -0
- aiq/front_ends/console/console_front_end_config.py +32 -0
- aiq/front_ends/console/console_front_end_plugin.py +96 -0
- aiq/front_ends/console/register.py +25 -0
- aiq/front_ends/cron/__init__.py +14 -0
- aiq/front_ends/fastapi/__init__.py +14 -0
- aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
- aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
- aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +107 -0
- aiq/front_ends/fastapi/fastapi_front_end_config.py +234 -0
- aiq/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
- aiq/front_ends/fastapi/fastapi_front_end_plugin.py +116 -0
- aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +1092 -0
- aiq/front_ends/fastapi/html_snippets/__init__.py +14 -0
- aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
- aiq/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
- aiq/front_ends/fastapi/job_store.py +183 -0
- aiq/front_ends/fastapi/main.py +72 -0
- aiq/front_ends/fastapi/message_handler.py +298 -0
- aiq/front_ends/fastapi/message_validator.py +345 -0
- aiq/front_ends/fastapi/register.py +25 -0
- aiq/front_ends/fastapi/response_helpers.py +195 -0
- aiq/front_ends/fastapi/step_adaptor.py +321 -0
- aiq/front_ends/mcp/__init__.py +14 -0
- aiq/front_ends/mcp/mcp_front_end_config.py +32 -0
- aiq/front_ends/mcp/mcp_front_end_plugin.py +93 -0
- aiq/front_ends/mcp/register.py +27 -0
- aiq/front_ends/mcp/tool_converter.py +242 -0
- aiq/front_ends/register.py +22 -0
- aiq/front_ends/simple_base/__init__.py +14 -0
- aiq/front_ends/simple_base/simple_front_end_plugin_base.py +54 -0
- aiq/llm/__init__.py +0 -0
- aiq/llm/aws_bedrock_llm.py +57 -0
- aiq/llm/nim_llm.py +46 -0
- aiq/llm/openai_llm.py +46 -0
- aiq/llm/register.py +23 -0
- aiq/llm/utils/__init__.py +14 -0
- aiq/llm/utils/env_config_value.py +94 -0
- aiq/llm/utils/error.py +17 -0
- aiq/memory/__init__.py +20 -0
- aiq/memory/interfaces.py +183 -0
- aiq/memory/models.py +112 -0
- aiq/meta/module_to_distro.json +3 -0
- aiq/meta/pypi.md +58 -0
- aiq/object_store/__init__.py +20 -0
- aiq/object_store/in_memory_object_store.py +76 -0
- aiq/object_store/interfaces.py +84 -0
- aiq/object_store/models.py +36 -0
- aiq/object_store/register.py +20 -0
- aiq/observability/__init__.py +14 -0
- aiq/observability/exporter/__init__.py +14 -0
- aiq/observability/exporter/base_exporter.py +449 -0
- aiq/observability/exporter/exporter.py +78 -0
- aiq/observability/exporter/file_exporter.py +33 -0
- aiq/observability/exporter/processing_exporter.py +322 -0
- aiq/observability/exporter/raw_exporter.py +52 -0
- aiq/observability/exporter/span_exporter.py +265 -0
- aiq/observability/exporter_manager.py +335 -0
- aiq/observability/mixin/__init__.py +14 -0
- aiq/observability/mixin/batch_config_mixin.py +26 -0
- aiq/observability/mixin/collector_config_mixin.py +23 -0
- aiq/observability/mixin/file_mixin.py +288 -0
- aiq/observability/mixin/file_mode.py +23 -0
- aiq/observability/mixin/resource_conflict_mixin.py +134 -0
- aiq/observability/mixin/serialize_mixin.py +61 -0
- aiq/observability/mixin/type_introspection_mixin.py +183 -0
- aiq/observability/processor/__init__.py +14 -0
- aiq/observability/processor/batching_processor.py +310 -0
- aiq/observability/processor/callback_processor.py +42 -0
- aiq/observability/processor/intermediate_step_serializer.py +28 -0
- aiq/observability/processor/processor.py +71 -0
- aiq/observability/register.py +96 -0
- aiq/observability/utils/__init__.py +14 -0
- aiq/observability/utils/dict_utils.py +236 -0
- aiq/observability/utils/time_utils.py +31 -0
- aiq/plugins/.namespace +1 -0
- aiq/profiler/__init__.py +0 -0
- aiq/profiler/calc/__init__.py +14 -0
- aiq/profiler/calc/calc_runner.py +627 -0
- aiq/profiler/calc/calculations.py +288 -0
- aiq/profiler/calc/data_models.py +188 -0
- aiq/profiler/calc/plot.py +345 -0
- aiq/profiler/callbacks/__init__.py +0 -0
- aiq/profiler/callbacks/agno_callback_handler.py +295 -0
- aiq/profiler/callbacks/base_callback_class.py +20 -0
- aiq/profiler/callbacks/langchain_callback_handler.py +290 -0
- aiq/profiler/callbacks/llama_index_callback_handler.py +205 -0
- aiq/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
- aiq/profiler/callbacks/token_usage_base_model.py +27 -0
- aiq/profiler/data_frame_row.py +51 -0
- aiq/profiler/data_models.py +24 -0
- aiq/profiler/decorators/__init__.py +0 -0
- aiq/profiler/decorators/framework_wrapper.py +131 -0
- aiq/profiler/decorators/function_tracking.py +254 -0
- aiq/profiler/forecasting/__init__.py +0 -0
- aiq/profiler/forecasting/config.py +18 -0
- aiq/profiler/forecasting/model_trainer.py +75 -0
- aiq/profiler/forecasting/models/__init__.py +22 -0
- aiq/profiler/forecasting/models/forecasting_base_model.py +40 -0
- aiq/profiler/forecasting/models/linear_model.py +196 -0
- aiq/profiler/forecasting/models/random_forest_regressor.py +268 -0
- aiq/profiler/inference_metrics_model.py +28 -0
- aiq/profiler/inference_optimization/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +460 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
- aiq/profiler/inference_optimization/data_models.py +386 -0
- aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
- aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
- aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
- aiq/profiler/inference_optimization/llm_metrics.py +212 -0
- aiq/profiler/inference_optimization/prompt_caching.py +163 -0
- aiq/profiler/inference_optimization/token_uniqueness.py +107 -0
- aiq/profiler/inference_optimization/workflow_runtimes.py +72 -0
- aiq/profiler/intermediate_property_adapter.py +102 -0
- aiq/profiler/profile_runner.py +473 -0
- aiq/profiler/utils.py +184 -0
- aiq/registry_handlers/__init__.py +0 -0
- aiq/registry_handlers/local/__init__.py +0 -0
- aiq/registry_handlers/local/local_handler.py +176 -0
- aiq/registry_handlers/local/register_local.py +37 -0
- aiq/registry_handlers/metadata_factory.py +60 -0
- aiq/registry_handlers/package_utils.py +567 -0
- aiq/registry_handlers/pypi/__init__.py +0 -0
- aiq/registry_handlers/pypi/pypi_handler.py +251 -0
- aiq/registry_handlers/pypi/register_pypi.py +40 -0
- aiq/registry_handlers/register.py +21 -0
- aiq/registry_handlers/registry_handler_base.py +157 -0
- aiq/registry_handlers/rest/__init__.py +0 -0
- aiq/registry_handlers/rest/register_rest.py +56 -0
- aiq/registry_handlers/rest/rest_handler.py +237 -0
- aiq/registry_handlers/schemas/__init__.py +0 -0
- aiq/registry_handlers/schemas/headers.py +42 -0
- aiq/registry_handlers/schemas/package.py +68 -0
- aiq/registry_handlers/schemas/publish.py +63 -0
- aiq/registry_handlers/schemas/pull.py +82 -0
- aiq/registry_handlers/schemas/remove.py +36 -0
- aiq/registry_handlers/schemas/search.py +91 -0
- aiq/registry_handlers/schemas/status.py +47 -0
- aiq/retriever/__init__.py +0 -0
- aiq/retriever/interface.py +37 -0
- aiq/retriever/milvus/__init__.py +14 -0
- aiq/retriever/milvus/register.py +81 -0
- aiq/retriever/milvus/retriever.py +228 -0
- aiq/retriever/models.py +74 -0
- aiq/retriever/nemo_retriever/__init__.py +14 -0
- aiq/retriever/nemo_retriever/register.py +60 -0
- aiq/retriever/nemo_retriever/retriever.py +190 -0
- aiq/retriever/register.py +22 -0
- aiq/runtime/__init__.py +14 -0
- aiq/runtime/loader.py +215 -0
- aiq/runtime/runner.py +190 -0
- aiq/runtime/session.py +158 -0
- aiq/runtime/user_metadata.py +130 -0
- aiq/settings/__init__.py +0 -0
- aiq/settings/global_settings.py +318 -0
- aiq/test/.namespace +1 -0
- aiq/tool/__init__.py +0 -0
- aiq/tool/chat_completion.py +74 -0
- aiq/tool/code_execution/README.md +151 -0
- aiq/tool/code_execution/__init__.py +0 -0
- aiq/tool/code_execution/code_sandbox.py +267 -0
- aiq/tool/code_execution/local_sandbox/.gitignore +1 -0
- aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
- aiq/tool/code_execution/local_sandbox/__init__.py +13 -0
- aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +198 -0
- aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +6 -0
- aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +50 -0
- aiq/tool/code_execution/register.py +74 -0
- aiq/tool/code_execution/test_code_execution_sandbox.py +414 -0
- aiq/tool/code_execution/utils.py +100 -0
- aiq/tool/datetime_tools.py +42 -0
- aiq/tool/document_search.py +141 -0
- aiq/tool/github_tools/__init__.py +0 -0
- aiq/tool/github_tools/create_github_commit.py +133 -0
- aiq/tool/github_tools/create_github_issue.py +87 -0
- aiq/tool/github_tools/create_github_pr.py +106 -0
- aiq/tool/github_tools/get_github_file.py +106 -0
- aiq/tool/github_tools/get_github_issue.py +166 -0
- aiq/tool/github_tools/get_github_pr.py +256 -0
- aiq/tool/github_tools/update_github_issue.py +100 -0
- aiq/tool/mcp/__init__.py +14 -0
- aiq/tool/mcp/exceptions.py +142 -0
- aiq/tool/mcp/mcp_client.py +255 -0
- aiq/tool/mcp/mcp_tool.py +96 -0
- aiq/tool/memory_tools/__init__.py +0 -0
- aiq/tool/memory_tools/add_memory_tool.py +79 -0
- aiq/tool/memory_tools/delete_memory_tool.py +67 -0
- aiq/tool/memory_tools/get_memory_tool.py +72 -0
- aiq/tool/nvidia_rag.py +95 -0
- aiq/tool/register.py +38 -0
- aiq/tool/retriever.py +89 -0
- aiq/tool/server_tools.py +66 -0
- aiq/utils/__init__.py +0 -0
- aiq/utils/data_models/__init__.py +0 -0
- aiq/utils/data_models/schema_validator.py +58 -0
- aiq/utils/debugging_utils.py +43 -0
- aiq/utils/dump_distro_mapping.py +32 -0
- aiq/utils/exception_handlers/__init__.py +0 -0
- aiq/utils/exception_handlers/automatic_retries.py +289 -0
- aiq/utils/exception_handlers/mcp.py +211 -0
- aiq/utils/exception_handlers/schemas.py +114 -0
- aiq/utils/io/__init__.py +0 -0
- aiq/utils/io/model_processing.py +28 -0
- aiq/utils/io/yaml_tools.py +119 -0
- aiq/utils/log_utils.py +37 -0
- aiq/utils/metadata_utils.py +74 -0
- aiq/utils/optional_imports.py +142 -0
- aiq/utils/producer_consumer_queue.py +178 -0
- aiq/utils/reactive/__init__.py +0 -0
- aiq/utils/reactive/base/__init__.py +0 -0
- aiq/utils/reactive/base/observable_base.py +65 -0
- aiq/utils/reactive/base/observer_base.py +55 -0
- aiq/utils/reactive/base/subject_base.py +79 -0
- aiq/utils/reactive/observable.py +59 -0
- aiq/utils/reactive/observer.py +76 -0
- aiq/utils/reactive/subject.py +131 -0
- aiq/utils/reactive/subscription.py +49 -0
- aiq/utils/settings/__init__.py +0 -0
- aiq/utils/settings/global_settings.py +197 -0
- aiq/utils/string_utils.py +38 -0
- aiq/utils/type_converter.py +290 -0
- aiq/utils/type_utils.py +484 -0
- aiq/utils/url_utils.py +27 -0
- nvidia_nat-1.2.0rc5.dist-info/METADATA +363 -0
- nvidia_nat-1.2.0rc5.dist-info/RECORD +435 -0
- nvidia_nat-1.2.0rc5.dist-info/WHEEL +5 -0
- nvidia_nat-1.2.0rc5.dist-info/entry_points.txt +20 -0
- nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE-3rd-party.txt +3686 -0
- nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE.md +201 -0
- nvidia_nat-1.2.0rc5.dist-info/top_level.txt +1 -0
|
@@ -0,0 +1,242 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import json
|
|
17
|
+
import logging
|
|
18
|
+
from inspect import Parameter
|
|
19
|
+
from inspect import Signature
|
|
20
|
+
|
|
21
|
+
from mcp.server.fastmcp import FastMCP
|
|
22
|
+
from pydantic import BaseModel
|
|
23
|
+
|
|
24
|
+
from aiq.builder.function import Function
|
|
25
|
+
from aiq.builder.function_base import FunctionBase
|
|
26
|
+
from aiq.builder.workflow import Workflow
|
|
27
|
+
|
|
28
|
+
logger = logging.getLogger(__name__)
|
|
29
|
+
|
|
30
|
+
|
|
31
|
+
def create_function_wrapper(
    function_name: str,
    function: FunctionBase,
    schema: type[BaseModel],
    is_workflow: bool = False,
):
    """Create a wrapper function that exposes the actual parameters of an AIQ Function as an MCP tool.

    The returned coroutine accepts keyword arguments only. Its ``__signature__`` is built from the
    fields of ``schema`` (or a single ``query: str`` parameter when the schema is ``AIQChatRequest``)
    and its ``__name__`` is set to ``function_name``.

    Args:
        function_name: The name of the function/tool
        function: The AIQ Function object
        schema: The input schema of the function
        is_workflow: Whether the function is a Workflow

    Returns:
        A wrapper function suitable for registration with MCP
    """
    # AIQChatRequest is special-cased: the tool exposes one `query` string instead of the schema fields.
    is_chat_request = schema.__name__ == "AIQChatRequest" or (hasattr(schema, "__qualname__")
                                                              and "AIQChatRequest" in schema.__qualname__)

    if is_chat_request:
        logger.info("Function %s uses AIQChatRequest - creating simplified interface", function_name)

        parameters = [Parameter(
            name="query",
            kind=Parameter.KEYWORD_ONLY,
            default=Parameter.empty,
            annotation=str,
        )]
    else:
        # Regular case - one keyword-only parameter per field of the input schema.
        parameters = [
            Parameter(
                name=name,
                kind=Parameter.KEYWORD_ONLY,
                # `is_required` is a method on pydantic's FieldInfo; referencing it without calling it
                # is always truthy, which made every field look required. Optional fields advertise
                # the schema's own default so an omitted argument still validates against the schema.
                default=(Parameter.empty if field.is_required() else field.get_default(call_default_factory=True)),
                annotation=field.annotation,
            ) for name, field in schema.model_fields.items()
        ]

    # The public signature deliberately has no `ctx` parameter; the wrapper strips it internally.
    sig = Signature(parameters=parameters, return_annotation=str)

    async def wrapper_with_ctx(**kwargs):
        """Internal wrapper that will be called by MCP."""
        # A `ctx` keyword, when supplied, is consumed here and never forwarded to the AIQ function.
        ctx = kwargs.pop("ctx", None)

        if ctx:
            # FastMCP's Context.info is a coroutine taking a single message string, so the message
            # is formatted up front and the call is awaited.
            await ctx.info(f"Calling function {function_name} with args: {json.dumps(kwargs, default=str)}")
            await ctx.report_progress(0, 100)

        try:
            if is_chat_request:
                # Imported lazily, as in the original implementation.
                from aiq.data_models.api_server import AIQChatRequest

                # Create a chat request from the query string
                query = kwargs.get("query", "")
                chat_request = AIQChatRequest.from_string(query)

                if is_workflow:
                    # Workflow.run is used as an async context manager yielding a runner.
                    async with function.run(chat_request) as runner:
                        result = await runner.result(to_type=str)
                else:
                    # Regular functions use ainvoke
                    result = await function.ainvoke(chat_request, to_type=str)
            else:
                # Rebuild a nested pydantic input when a single-field schema was flattened.
                # NOTE(review): in this branch `parameters` holds exactly one entry per schema field,
                # so this condition looks unreachable - confirm before relying on it.
                if len(schema.model_fields) == 1 and len(parameters) > 1:
                    field_name = next(iter(schema.model_fields.keys()))
                    field_type = schema.model_fields[field_name].annotation

                    # If it's a pydantic model, create an instance and pass it under the field name.
                    if hasattr(field_type, "model_validate"):
                        nested_obj = field_type.model_validate(kwargs)
                        kwargs = {field_name: nested_obj}

                if is_workflow:
                    # For a workflow with regular input, the first argument value is the input;
                    # an empty string is used when no arguments were given.
                    input_value = next(iter(kwargs.values()), "")

                    async with function.run(input_value) as runner:
                        result = await runner.result(to_type=str)
                else:
                    # Regular function call
                    result = await function.acall_invoke(**kwargs)

            # Report completion
            if ctx:
                await ctx.report_progress(100, 100)

            # Normalize the result to a string: str as-is, dict/list as JSON, anything else via str().
            if isinstance(result, str):
                return result
            if isinstance(result, (dict, list)):
                return json.dumps(result, default=str)
            return str(result)
        except Exception as e:
            # Surface the failure to the MCP context (when present), then propagate it unchanged.
            if ctx:
                await ctx.error(f"Error calling function {function_name}: {e}")
            raise

    # Set the signature on the wrapper function (WITHOUT ctx) and name it after the tool.
    wrapper_with_ctx.__signature__ = sig
    wrapper_with_ctx.__name__ = function_name

    return wrapper_with_ctx
|
|
179
|
+
|
|
180
|
+
|
|
181
|
+
def get_function_description(function: FunctionBase) -> str:
    """
    Retrieve a human-readable description for an AIQ function or workflow.

    For a Workflow, the first non-empty value among the following is used, in this order:
    1. The Workflow's own 'description' attribute, if it has one.
    2. The 'description' attribute of the Workflow's config.
    3. The 'topic' attribute of the Workflow's config.

    For a regular Function, its 'description' attribute is returned as-is.
    Anything else yields an empty string.

    Args:
        function: The AIQ FunctionBase instance (Function or Workflow).

    Returns:
        The best available description string for the function.
    """
    if isinstance(function, Workflow):
        workflow_config = function.config

        # Ordered (owner, attribute) lookups; evaluated lazily so later ones are only
        # touched when the earlier ones are missing or empty.
        lookups = (
            (function, "description"),
            (workflow_config, "description"),
            (workflow_config, "topic"),
        )
        for owner, attr_name in lookups:
            candidate = getattr(owner, attr_name, None)
            if candidate:
                return candidate
        return ""

    if isinstance(function, Function):
        return function.description

    return ""
|
|
216
|
+
|
|
217
|
+
|
|
218
|
+
def register_function_with_mcp(mcp: FastMCP, function_name: str, function: FunctionBase) -> None:
    """Register an AIQ Function as an MCP tool.

    Reads the function's input schema, resolves its description, builds a wrapper
    via ``create_function_wrapper`` and registers that wrapper through ``mcp.tool``.

    Args:
        mcp: The FastMCP instance
        function_name: The name to register the function under
        function: The AIQ Function to register
    """
    logger.info("Registering function %s with MCP", function_name)

    # The input schema drives the parameters exposed by the wrapper.
    schema = function.input_schema
    logger.info("Function %s has input schema: %s", function_name, schema)

    # Workflows are invoked differently from plain functions, so flag them up front.
    wraps_workflow = isinstance(function, Workflow)
    if wraps_workflow:
        logger.info("Function %s is a Workflow", function_name)

    description = get_function_description(function)

    # Build the callable first, then hand it to the decorator returned by mcp.tool.
    tool_callable = create_function_wrapper(function_name, function, schema, wraps_workflow)
    register_tool = mcp.tool(name=function_name, description=description)
    register_tool(tool_callable)
|
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
# pylint: disable=unused-import
|
|
17
|
+
# flake8: noqa
|
|
18
|
+
# isort:skip_file
|
|
19
|
+
|
|
20
|
+
from .console import register as console_register
|
|
21
|
+
from .fastapi import register as fastapi_register
|
|
22
|
+
from .mcp import register as mcp_register
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
@@ -0,0 +1,54 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import logging
|
|
17
|
+
from abc import ABC
|
|
18
|
+
from abc import abstractmethod
|
|
19
|
+
from io import StringIO
|
|
20
|
+
|
|
21
|
+
import click
|
|
22
|
+
|
|
23
|
+
from aiq.builder.front_end import FrontEndBase
|
|
24
|
+
from aiq.builder.workflow_builder import WorkflowBuilder
|
|
25
|
+
from aiq.data_models.front_end import FrontEndConfigT
|
|
26
|
+
from aiq.runtime.session import AIQSessionManager
|
|
27
|
+
|
|
28
|
+
logger = logging.getLogger(__name__)
|
|
29
|
+
|
|
30
|
+
|
|
31
|
+
class SimpleFrontEndPluginBase(FrontEndBase[FrontEndConfigT], ABC):
    """Front-end base that builds the workflow and delegates the actual work to ``run_workflow``.

    Subclasses only implement ``run_workflow``; ``run`` builds the workflow from
    ``self.full_config`` and wraps it in an ``AIQSessionManager`` first.
    """

    async def pre_run(self):
        """No-op ``pre_run`` implementation."""

    async def run(self):
        """Build the workflow from ``self.full_config`` and pass a session manager to ``run_workflow``."""
        # The workflow must be used while the builder context is still open, otherwise it cleans up.
        async with WorkflowBuilder.from_config(config=self.full_config) as builder:

            # Render the configuration summary only when INFO logging is enabled.
            if logger.isEnabledFor(logging.INFO):
                summary_buffer = StringIO()
                self.full_config.print_summary(stream=summary_buffer)
                click.echo(summary_buffer.getvalue())

            session_manager = AIQSessionManager(builder.build())
            await self.run_workflow(session_manager)

    @abstractmethod
    async def run_workflow(self, session_manager: AIQSessionManager):
        """Run the front end against ``session_manager``; must be provided by subclasses."""
|
aiq/llm/__init__.py
ADDED
|
File without changes
|
|
@@ -0,0 +1,57 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from pydantic import AliasChoices
|
|
17
|
+
from pydantic import ConfigDict
|
|
18
|
+
from pydantic import Field
|
|
19
|
+
|
|
20
|
+
from aiq.builder.builder import Builder
|
|
21
|
+
from aiq.builder.llm import LLMProviderInfo
|
|
22
|
+
from aiq.cli.register_workflow import register_llm_provider
|
|
23
|
+
from aiq.data_models.llm import LLMBaseConfig
|
|
24
|
+
from aiq.data_models.retry_mixin import RetryMixin
|
|
25
|
+
|
|
26
|
+
|
|
27
|
+
class AWSBedrockModelConfig(LLMBaseConfig, RetryMixin, name="aws_bedrock"):
    """An AWS Bedrock llm provider to be used with an LLM client."""

    # Empty ``protected_namespaces`` so the ``model_name`` field does not collide with
    # pydantic's protected ``model_`` prefix.
    model_config = ConfigDict(protected_namespaces=())

    # Completion parameters
    # Accepts ``model_name`` or ``model`` on input; serialized under the ``model`` alias.
    model_name: str = Field(validation_alias=AliasChoices("model_name", "model"),
                            serialization_alias="model",
                            description="The model name for the hosted AWS Bedrock.")
    temperature: float = Field(default=0.0, ge=0.0, le=1.0, description="Sampling temperature in [0, 1].")
    # The two description literals are concatenated, so the first must end with a space.
    max_tokens: int | None = Field(default=1024,
                                   gt=0,
                                   description="Maximum number of tokens to generate. "
                                   "This field is ONLY required when using AWS Bedrock with Langchain.")
    # ``context_size`` is the input budget, not the generation budget (that is ``max_tokens``).
    context_size: int | None = Field(default=1024,
                                     gt=0,
                                     description="Maximum number of tokens available for input. "
                                     "This field is ONLY required when using AWS Bedrock with LlamaIndex.")

    # Client parameters
    # NOTE(review): the default is the *string* "None", not ``None``. It is kept unchanged here because
    # the default is part of the public config interface — confirm whether ``default=None`` was intended.
    region_name: str | None = Field(default="None", description="AWS region to use.")
    base_url: str | None = Field(
        default=None, description="Bedrock endpoint to use. Needed if you don't want to default to us-east-1 endpoint.")
    credentials_profile_name: str | None = Field(
        default=None, description="The name of the profile in the ~/.aws/credentials or ~/.aws/config files.")
|
|
52
|
+
|
|
53
|
+
|
|
54
|
+
@register_llm_provider(config_type=AWSBedrockModelConfig)
async def aws_bedrock_model(llm_config: AWSBedrockModelConfig, builder: Builder):
    """Yield the ``LLMProviderInfo`` describing an ``AWSBedrockModelConfig``.

    ``builder`` is accepted as part of the signature but is not used in this body.
    """
    provider_info = LLMProviderInfo(config=llm_config, description="A AWS Bedrock model for use with an LLM client.")
    yield provider_info
|
aiq/llm/nim_llm.py
ADDED
|
@@ -0,0 +1,46 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from pydantic import AliasChoices
|
|
17
|
+
from pydantic import ConfigDict
|
|
18
|
+
from pydantic import Field
|
|
19
|
+
from pydantic import PositiveInt
|
|
20
|
+
|
|
21
|
+
from aiq.builder.builder import Builder
|
|
22
|
+
from aiq.builder.llm import LLMProviderInfo
|
|
23
|
+
from aiq.cli.register_workflow import register_llm_provider
|
|
24
|
+
from aiq.data_models.llm import LLMBaseConfig
|
|
25
|
+
from aiq.data_models.retry_mixin import RetryMixin
|
|
26
|
+
|
|
27
|
+
|
|
28
|
+
class NIMModelConfig(LLMBaseConfig, RetryMixin, name="nim"):
    """An NVIDIA Inference Microservice (NIM) llm provider to be used with an LLM client."""

    # Empty ``protected_namespaces`` so the ``model_name`` field does not collide with
    # pydantic's protected ``model_`` prefix.
    model_config = ConfigDict(protected_namespaces=())

    # Connection settings
    api_key: str | None = Field(
        default=None,
        description="NVIDIA API key to interact with hosted NIM.",
    )
    base_url: str | None = Field(
        default=None,
        description="Base url to the hosted NIM.",
    )

    # Accepts ``model_name`` or ``model`` on input; serialized under the ``model`` alias.
    model_name: str = Field(
        validation_alias=AliasChoices("model_name", "model"),
        serialization_alias="model",
        description="The model name for the hosted NIM.",
    )

    # Sampling settings
    temperature: float = Field(
        default=0.0,
        description="Sampling temperature in [0, 1].",
    )
    top_p: float = Field(
        default=1.0,
        description="Top-p for distribution sampling.",
    )
    max_tokens: PositiveInt = Field(
        default=300,
        description="Maximum number of tokens to generate.",
    )
|
|
41
|
+
|
|
42
|
+
|
|
43
|
+
@register_llm_provider(config_type=NIMModelConfig)
async def nim_model(llm_config: NIMModelConfig, builder: Builder):
    """Yield the ``LLMProviderInfo`` describing a ``NIMModelConfig``.

    ``builder`` is accepted as part of the signature but is not used in this body.
    """
    provider_info = LLMProviderInfo(config=llm_config, description="A NIM model for use with an LLM client.")
    yield provider_info
|
aiq/llm/openai_llm.py
ADDED
|
@@ -0,0 +1,46 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from pydantic import AliasChoices
|
|
17
|
+
from pydantic import ConfigDict
|
|
18
|
+
from pydantic import Field
|
|
19
|
+
|
|
20
|
+
from aiq.builder.builder import Builder
|
|
21
|
+
from aiq.builder.llm import LLMProviderInfo
|
|
22
|
+
from aiq.cli.register_workflow import register_llm_provider
|
|
23
|
+
from aiq.data_models.llm import LLMBaseConfig
|
|
24
|
+
from aiq.data_models.retry_mixin import RetryMixin
|
|
25
|
+
|
|
26
|
+
|
|
27
|
+
class OpenAIModelConfig(LLMBaseConfig, RetryMixin, name="openai"):
    """An OpenAI LLM provider to be used with an LLM client."""

    # Empty ``protected_namespaces`` so ``model_name`` does not collide with pydantic's protected
    # ``model_`` prefix; ``extra="allow"`` keeps fields that are not declared below.
    model_config = ConfigDict(protected_namespaces=(), extra="allow")

    # Connection settings
    api_key: str | None = Field(
        default=None,
        description="OpenAI API key to interact with hosted model.",
    )
    base_url: str | None = Field(
        default=None,
        description="Base url to the hosted model.",
    )

    # Accepts ``model_name`` or ``model`` on input; serialized under the ``model`` alias.
    model_name: str = Field(
        validation_alias=AliasChoices("model_name", "model"),
        serialization_alias="model",
        description="The OpenAI hosted model name.",
    )

    # Sampling settings
    temperature: float = Field(
        default=0.0,
        description="Sampling temperature in [0, 1].",
    )
    top_p: float = Field(
        default=1.0,
        description="Top-p for distribution sampling.",
    )
    seed: int | None = Field(
        default=None,
        description="Random seed to set for generation.",
    )

    # Request handling
    max_retries: int = Field(
        default=10,
        description="The max number of retries for the request.",
    )
|
|
41
|
+
|
|
42
|
+
|
|
43
|
+
@register_llm_provider(config_type=OpenAIModelConfig)
async def openai_llm(config: OpenAIModelConfig, builder: Builder):
    """Yield the ``LLMProviderInfo`` describing an ``OpenAIModelConfig``.

    ``builder`` is accepted as part of the signature but is not used in this body.
    """
    provider_info = LLMProviderInfo(config=config, description="An OpenAI model for use with an LLM client.")
    yield provider_info
|
aiq/llm/register.py
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
# pylint: disable=unused-import
|
|
17
|
+
# flake8: noqa
|
|
18
|
+
# isort:skip_file
|
|
19
|
+
|
|
20
|
+
# Import any providers which need to be automatically registered here
|
|
21
|
+
from . import aws_bedrock_llm
|
|
22
|
+
from . import nim_llm
|
|
23
|
+
from . import openai_llm
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
@@ -0,0 +1,94 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import os
|
|
17
|
+
from abc import ABC
|
|
18
|
+
from enum import Enum
|
|
19
|
+
|
|
20
|
+
|
|
21
|
+
class EnvConfigValueSource(Enum):
|
|
22
|
+
ENV_DEFAULT = 1
|
|
23
|
+
CONSTRUCTOR = 2
|
|
24
|
+
ENV_OVERRIDE = 3
|
|
25
|
+
|
|
26
|
+
|
|
27
|
+
class EnvConfigValue(ABC):
|
|
28
|
+
"""
|
|
29
|
+
A wrapper for a string used as a configuration value which can be loaded from the system environment or injected via
|
|
30
|
+
the constructor. This class should be subclassed and the class fields `_ENV_KEY` and `_ENV_KEY_OVERRIDE` can be set
|
|
31
|
+
to enable environment-loading functionality. Convienience properties are available to check from where the value was
|
|
32
|
+
loaded.
|
|
33
|
+
"""
|
|
34
|
+
|
|
35
|
+
_ENV_KEY: str | None = None
|
|
36
|
+
_ENV_KEY_OVERRIDE: str | None = None
|
|
37
|
+
_ALLOW_NONE: bool = False
|
|
38
|
+
|
|
39
|
+
def __init__(self, value: str | None = None, use_env: bool = True):
|
|
40
|
+
"""
|
|
41
|
+
Parameters
|
|
42
|
+
----------
|
|
43
|
+
value : str, optional
|
|
44
|
+
The value to be contained in the EnvConfigValue. If the value is `None`, an attempt will be made to load it
|
|
45
|
+
from the environment using `_ENV_KEY`. if the `_ENV_KEY_OVERRIDE` field is not `None`, an attempt will be
|
|
46
|
+
made to load that environment variable in place of the passed-in value.
|
|
47
|
+
use_env : bool
|
|
48
|
+
If False, all environment-loading logic will be bypassed and the passed-in value will be used as-is.
|
|
49
|
+
defaults to True.
|
|
50
|
+
"""
|
|
51
|
+
|
|
52
|
+
self._source = EnvConfigValueSource.CONSTRUCTOR
|
|
53
|
+
|
|
54
|
+
if use_env:
|
|
55
|
+
if value is None and self.__class__._ENV_KEY is not None:
|
|
56
|
+
value = os.environ.get(self.__class__._ENV_KEY, None)
|
|
57
|
+
self._source = EnvConfigValueSource.ENV_DEFAULT
|
|
58
|
+
|
|
59
|
+
if self.__class__._ENV_KEY_OVERRIDE is not None and self.__class__._ENV_KEY_OVERRIDE in os.environ:
|
|
60
|
+
value = os.environ[self.__class__._ENV_KEY_OVERRIDE]
|
|
61
|
+
self._source = EnvConfigValueSource.ENV_OVERRIDE
|
|
62
|
+
|
|
63
|
+
if not self.__class__._ALLOW_NONE and value is None:
|
|
64
|
+
|
|
65
|
+
message = ("value must not be None, but provided value was None and no environment-based default or "
|
|
66
|
+
"override was found.")
|
|
67
|
+
|
|
68
|
+
if self.__class__._ENV_KEY is None:
|
|
69
|
+
raise ValueError(message)
|
|
70
|
+
|
|
71
|
+
raise ValueError(
|
|
72
|
+
f"{message} Try passing a value to the constructor, or setting the `{self.__class__._ENV_KEY}` "
|
|
73
|
+
"environment variable.")
|
|
74
|
+
|
|
75
|
+
else:
|
|
76
|
+
if not self.__class__._ALLOW_NONE and value is None:
|
|
77
|
+
raise ValueError("value must not be none")
|
|
78
|
+
|
|
79
|
+
assert isinstance(value, str) or value is None
|
|
80
|
+
|
|
81
|
+
self._value = value
|
|
82
|
+
self._use_env = use_env
|
|
83
|
+
|
|
84
|
+
@property
|
|
85
|
+
def source(self) -> EnvConfigValueSource:
|
|
86
|
+
return self._source
|
|
87
|
+
|
|
88
|
+
@property
|
|
89
|
+
def use_env(self) -> bool:
|
|
90
|
+
return self._use_env
|
|
91
|
+
|
|
92
|
+
@property
|
|
93
|
+
def value(self) -> str | None:
|
|
94
|
+
return self._value
|
aiq/llm/utils/error.py
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
# Template for missing-dependency errors: ``{package}`` is filled in via ``str.format``.
# The text ends with a newline after "command:".
IMPORT_ERROR_MESSAGE = ("{package} not found. "
                        "Install it and other additional dependencies by running the following command:\n")
|
aiq/memory/__init__.py
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
"""
|
|
16
|
+
AIQ Toolkit Memory Module
|
|
17
|
+
|
|
18
|
+
This package provides foundational classes and interfaces
|
|
19
|
+
for managing text-based memory in AIQ Toolkit's LLM-based agents.
|
|
20
|
+
"""
|