nvidia-nat 1.2.0rc5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- aiq/agent/__init__.py +0 -0
- aiq/agent/base.py +239 -0
- aiq/agent/dual_node.py +67 -0
- aiq/agent/react_agent/__init__.py +0 -0
- aiq/agent/react_agent/agent.py +355 -0
- aiq/agent/react_agent/output_parser.py +104 -0
- aiq/agent/react_agent/prompt.py +41 -0
- aiq/agent/react_agent/register.py +149 -0
- aiq/agent/reasoning_agent/__init__.py +0 -0
- aiq/agent/reasoning_agent/reasoning_agent.py +225 -0
- aiq/agent/register.py +23 -0
- aiq/agent/rewoo_agent/__init__.py +0 -0
- aiq/agent/rewoo_agent/agent.py +411 -0
- aiq/agent/rewoo_agent/prompt.py +108 -0
- aiq/agent/rewoo_agent/register.py +158 -0
- aiq/agent/tool_calling_agent/__init__.py +0 -0
- aiq/agent/tool_calling_agent/agent.py +119 -0
- aiq/agent/tool_calling_agent/register.py +106 -0
- aiq/authentication/__init__.py +14 -0
- aiq/authentication/api_key/__init__.py +14 -0
- aiq/authentication/api_key/api_key_auth_provider.py +96 -0
- aiq/authentication/api_key/api_key_auth_provider_config.py +124 -0
- aiq/authentication/api_key/register.py +26 -0
- aiq/authentication/exceptions/__init__.py +14 -0
- aiq/authentication/exceptions/api_key_exceptions.py +38 -0
- aiq/authentication/http_basic_auth/__init__.py +0 -0
- aiq/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
- aiq/authentication/http_basic_auth/register.py +30 -0
- aiq/authentication/interfaces.py +93 -0
- aiq/authentication/oauth2/__init__.py +14 -0
- aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +107 -0
- aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
- aiq/authentication/oauth2/register.py +25 -0
- aiq/authentication/register.py +21 -0
- aiq/builder/__init__.py +0 -0
- aiq/builder/builder.py +285 -0
- aiq/builder/component_utils.py +316 -0
- aiq/builder/context.py +264 -0
- aiq/builder/embedder.py +24 -0
- aiq/builder/eval_builder.py +161 -0
- aiq/builder/evaluator.py +29 -0
- aiq/builder/framework_enum.py +24 -0
- aiq/builder/front_end.py +73 -0
- aiq/builder/function.py +344 -0
- aiq/builder/function_base.py +380 -0
- aiq/builder/function_info.py +627 -0
- aiq/builder/intermediate_step_manager.py +174 -0
- aiq/builder/llm.py +25 -0
- aiq/builder/retriever.py +25 -0
- aiq/builder/user_interaction_manager.py +74 -0
- aiq/builder/workflow.py +148 -0
- aiq/builder/workflow_builder.py +1117 -0
- aiq/cli/__init__.py +14 -0
- aiq/cli/cli_utils/__init__.py +0 -0
- aiq/cli/cli_utils/config_override.py +231 -0
- aiq/cli/cli_utils/validation.py +37 -0
- aiq/cli/commands/__init__.py +0 -0
- aiq/cli/commands/configure/__init__.py +0 -0
- aiq/cli/commands/configure/channel/__init__.py +0 -0
- aiq/cli/commands/configure/channel/add.py +28 -0
- aiq/cli/commands/configure/channel/channel.py +36 -0
- aiq/cli/commands/configure/channel/remove.py +30 -0
- aiq/cli/commands/configure/channel/update.py +30 -0
- aiq/cli/commands/configure/configure.py +33 -0
- aiq/cli/commands/evaluate.py +139 -0
- aiq/cli/commands/info/__init__.py +14 -0
- aiq/cli/commands/info/info.py +39 -0
- aiq/cli/commands/info/list_channels.py +32 -0
- aiq/cli/commands/info/list_components.py +129 -0
- aiq/cli/commands/info/list_mcp.py +213 -0
- aiq/cli/commands/registry/__init__.py +14 -0
- aiq/cli/commands/registry/publish.py +88 -0
- aiq/cli/commands/registry/pull.py +118 -0
- aiq/cli/commands/registry/registry.py +38 -0
- aiq/cli/commands/registry/remove.py +108 -0
- aiq/cli/commands/registry/search.py +155 -0
- aiq/cli/commands/sizing/__init__.py +14 -0
- aiq/cli/commands/sizing/calc.py +297 -0
- aiq/cli/commands/sizing/sizing.py +27 -0
- aiq/cli/commands/start.py +246 -0
- aiq/cli/commands/uninstall.py +81 -0
- aiq/cli/commands/validate.py +47 -0
- aiq/cli/commands/workflow/__init__.py +14 -0
- aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
- aiq/cli/commands/workflow/templates/config.yml.j2 +16 -0
- aiq/cli/commands/workflow/templates/pyproject.toml.j2 +22 -0
- aiq/cli/commands/workflow/templates/register.py.j2 +5 -0
- aiq/cli/commands/workflow/templates/workflow.py.j2 +36 -0
- aiq/cli/commands/workflow/workflow.py +37 -0
- aiq/cli/commands/workflow/workflow_commands.py +313 -0
- aiq/cli/entrypoint.py +135 -0
- aiq/cli/main.py +44 -0
- aiq/cli/register_workflow.py +488 -0
- aiq/cli/type_registry.py +1000 -0
- aiq/data_models/__init__.py +14 -0
- aiq/data_models/api_server.py +694 -0
- aiq/data_models/authentication.py +231 -0
- aiq/data_models/common.py +171 -0
- aiq/data_models/component.py +54 -0
- aiq/data_models/component_ref.py +168 -0
- aiq/data_models/config.py +406 -0
- aiq/data_models/dataset_handler.py +123 -0
- aiq/data_models/discovery_metadata.py +335 -0
- aiq/data_models/embedder.py +27 -0
- aiq/data_models/evaluate.py +127 -0
- aiq/data_models/evaluator.py +26 -0
- aiq/data_models/front_end.py +26 -0
- aiq/data_models/function.py +30 -0
- aiq/data_models/function_dependencies.py +72 -0
- aiq/data_models/interactive.py +246 -0
- aiq/data_models/intermediate_step.py +302 -0
- aiq/data_models/invocation_node.py +38 -0
- aiq/data_models/llm.py +27 -0
- aiq/data_models/logging.py +26 -0
- aiq/data_models/memory.py +27 -0
- aiq/data_models/object_store.py +44 -0
- aiq/data_models/profiler.py +54 -0
- aiq/data_models/registry_handler.py +26 -0
- aiq/data_models/retriever.py +30 -0
- aiq/data_models/retry_mixin.py +35 -0
- aiq/data_models/span.py +187 -0
- aiq/data_models/step_adaptor.py +64 -0
- aiq/data_models/streaming.py +33 -0
- aiq/data_models/swe_bench_model.py +54 -0
- aiq/data_models/telemetry_exporter.py +26 -0
- aiq/data_models/ttc_strategy.py +30 -0
- aiq/embedder/__init__.py +0 -0
- aiq/embedder/langchain_client.py +41 -0
- aiq/embedder/nim_embedder.py +59 -0
- aiq/embedder/openai_embedder.py +43 -0
- aiq/embedder/register.py +24 -0
- aiq/eval/__init__.py +14 -0
- aiq/eval/config.py +60 -0
- aiq/eval/dataset_handler/__init__.py +0 -0
- aiq/eval/dataset_handler/dataset_downloader.py +106 -0
- aiq/eval/dataset_handler/dataset_filter.py +52 -0
- aiq/eval/dataset_handler/dataset_handler.py +254 -0
- aiq/eval/evaluate.py +506 -0
- aiq/eval/evaluator/__init__.py +14 -0
- aiq/eval/evaluator/base_evaluator.py +73 -0
- aiq/eval/evaluator/evaluator_model.py +45 -0
- aiq/eval/intermediate_step_adapter.py +99 -0
- aiq/eval/rag_evaluator/__init__.py +0 -0
- aiq/eval/rag_evaluator/evaluate.py +178 -0
- aiq/eval/rag_evaluator/register.py +143 -0
- aiq/eval/register.py +23 -0
- aiq/eval/remote_workflow.py +133 -0
- aiq/eval/runners/__init__.py +14 -0
- aiq/eval/runners/config.py +39 -0
- aiq/eval/runners/multi_eval_runner.py +54 -0
- aiq/eval/runtime_event_subscriber.py +52 -0
- aiq/eval/swe_bench_evaluator/__init__.py +0 -0
- aiq/eval/swe_bench_evaluator/evaluate.py +215 -0
- aiq/eval/swe_bench_evaluator/register.py +36 -0
- aiq/eval/trajectory_evaluator/__init__.py +0 -0
- aiq/eval/trajectory_evaluator/evaluate.py +75 -0
- aiq/eval/trajectory_evaluator/register.py +40 -0
- aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
- aiq/eval/tunable_rag_evaluator/evaluate.py +245 -0
- aiq/eval/tunable_rag_evaluator/register.py +52 -0
- aiq/eval/usage_stats.py +41 -0
- aiq/eval/utils/__init__.py +0 -0
- aiq/eval/utils/output_uploader.py +140 -0
- aiq/eval/utils/tqdm_position_registry.py +40 -0
- aiq/eval/utils/weave_eval.py +184 -0
- aiq/experimental/__init__.py +0 -0
- aiq/experimental/decorators/__init__.py +0 -0
- aiq/experimental/decorators/experimental_warning_decorator.py +130 -0
- aiq/experimental/test_time_compute/__init__.py +0 -0
- aiq/experimental/test_time_compute/editing/__init__.py +0 -0
- aiq/experimental/test_time_compute/editing/iterative_plan_refinement_editor.py +147 -0
- aiq/experimental/test_time_compute/editing/llm_as_a_judge_editor.py +204 -0
- aiq/experimental/test_time_compute/editing/motivation_aware_summarization.py +107 -0
- aiq/experimental/test_time_compute/functions/__init__.py +0 -0
- aiq/experimental/test_time_compute/functions/execute_score_select_function.py +105 -0
- aiq/experimental/test_time_compute/functions/its_tool_orchestration_function.py +205 -0
- aiq/experimental/test_time_compute/functions/its_tool_wrapper_function.py +146 -0
- aiq/experimental/test_time_compute/functions/plan_select_execute_function.py +224 -0
- aiq/experimental/test_time_compute/models/__init__.py +0 -0
- aiq/experimental/test_time_compute/models/editor_config.py +132 -0
- aiq/experimental/test_time_compute/models/scoring_config.py +112 -0
- aiq/experimental/test_time_compute/models/search_config.py +120 -0
- aiq/experimental/test_time_compute/models/selection_config.py +154 -0
- aiq/experimental/test_time_compute/models/stage_enums.py +43 -0
- aiq/experimental/test_time_compute/models/strategy_base.py +66 -0
- aiq/experimental/test_time_compute/models/tool_use_config.py +41 -0
- aiq/experimental/test_time_compute/models/ttc_item.py +48 -0
- aiq/experimental/test_time_compute/register.py +36 -0
- aiq/experimental/test_time_compute/scoring/__init__.py +0 -0
- aiq/experimental/test_time_compute/scoring/llm_based_agent_scorer.py +168 -0
- aiq/experimental/test_time_compute/scoring/llm_based_plan_scorer.py +168 -0
- aiq/experimental/test_time_compute/scoring/motivation_aware_scorer.py +111 -0
- aiq/experimental/test_time_compute/search/__init__.py +0 -0
- aiq/experimental/test_time_compute/search/multi_llm_planner.py +128 -0
- aiq/experimental/test_time_compute/search/multi_query_retrieval_search.py +122 -0
- aiq/experimental/test_time_compute/search/single_shot_multi_plan_planner.py +128 -0
- aiq/experimental/test_time_compute/selection/__init__.py +0 -0
- aiq/experimental/test_time_compute/selection/best_of_n_selector.py +63 -0
- aiq/experimental/test_time_compute/selection/llm_based_agent_output_selector.py +131 -0
- aiq/experimental/test_time_compute/selection/llm_based_output_merging_selector.py +159 -0
- aiq/experimental/test_time_compute/selection/llm_based_plan_selector.py +128 -0
- aiq/experimental/test_time_compute/selection/threshold_selector.py +58 -0
- aiq/front_ends/__init__.py +14 -0
- aiq/front_ends/console/__init__.py +14 -0
- aiq/front_ends/console/authentication_flow_handler.py +233 -0
- aiq/front_ends/console/console_front_end_config.py +32 -0
- aiq/front_ends/console/console_front_end_plugin.py +96 -0
- aiq/front_ends/console/register.py +25 -0
- aiq/front_ends/cron/__init__.py +14 -0
- aiq/front_ends/fastapi/__init__.py +14 -0
- aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
- aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
- aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +107 -0
- aiq/front_ends/fastapi/fastapi_front_end_config.py +234 -0
- aiq/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
- aiq/front_ends/fastapi/fastapi_front_end_plugin.py +116 -0
- aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +1092 -0
- aiq/front_ends/fastapi/html_snippets/__init__.py +14 -0
- aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
- aiq/front_ends/fastapi/intermediate_steps_subscriber.py +80 -0
- aiq/front_ends/fastapi/job_store.py +183 -0
- aiq/front_ends/fastapi/main.py +72 -0
- aiq/front_ends/fastapi/message_handler.py +298 -0
- aiq/front_ends/fastapi/message_validator.py +345 -0
- aiq/front_ends/fastapi/register.py +25 -0
- aiq/front_ends/fastapi/response_helpers.py +195 -0
- aiq/front_ends/fastapi/step_adaptor.py +321 -0
- aiq/front_ends/mcp/__init__.py +14 -0
- aiq/front_ends/mcp/mcp_front_end_config.py +32 -0
- aiq/front_ends/mcp/mcp_front_end_plugin.py +93 -0
- aiq/front_ends/mcp/register.py +27 -0
- aiq/front_ends/mcp/tool_converter.py +242 -0
- aiq/front_ends/register.py +22 -0
- aiq/front_ends/simple_base/__init__.py +14 -0
- aiq/front_ends/simple_base/simple_front_end_plugin_base.py +54 -0
- aiq/llm/__init__.py +0 -0
- aiq/llm/aws_bedrock_llm.py +57 -0
- aiq/llm/nim_llm.py +46 -0
- aiq/llm/openai_llm.py +46 -0
- aiq/llm/register.py +23 -0
- aiq/llm/utils/__init__.py +14 -0
- aiq/llm/utils/env_config_value.py +94 -0
- aiq/llm/utils/error.py +17 -0
- aiq/memory/__init__.py +20 -0
- aiq/memory/interfaces.py +183 -0
- aiq/memory/models.py +112 -0
- aiq/meta/module_to_distro.json +3 -0
- aiq/meta/pypi.md +58 -0
- aiq/object_store/__init__.py +20 -0
- aiq/object_store/in_memory_object_store.py +76 -0
- aiq/object_store/interfaces.py +84 -0
- aiq/object_store/models.py +36 -0
- aiq/object_store/register.py +20 -0
- aiq/observability/__init__.py +14 -0
- aiq/observability/exporter/__init__.py +14 -0
- aiq/observability/exporter/base_exporter.py +449 -0
- aiq/observability/exporter/exporter.py +78 -0
- aiq/observability/exporter/file_exporter.py +33 -0
- aiq/observability/exporter/processing_exporter.py +322 -0
- aiq/observability/exporter/raw_exporter.py +52 -0
- aiq/observability/exporter/span_exporter.py +265 -0
- aiq/observability/exporter_manager.py +335 -0
- aiq/observability/mixin/__init__.py +14 -0
- aiq/observability/mixin/batch_config_mixin.py +26 -0
- aiq/observability/mixin/collector_config_mixin.py +23 -0
- aiq/observability/mixin/file_mixin.py +288 -0
- aiq/observability/mixin/file_mode.py +23 -0
- aiq/observability/mixin/resource_conflict_mixin.py +134 -0
- aiq/observability/mixin/serialize_mixin.py +61 -0
- aiq/observability/mixin/type_introspection_mixin.py +183 -0
- aiq/observability/processor/__init__.py +14 -0
- aiq/observability/processor/batching_processor.py +310 -0
- aiq/observability/processor/callback_processor.py +42 -0
- aiq/observability/processor/intermediate_step_serializer.py +28 -0
- aiq/observability/processor/processor.py +71 -0
- aiq/observability/register.py +96 -0
- aiq/observability/utils/__init__.py +14 -0
- aiq/observability/utils/dict_utils.py +236 -0
- aiq/observability/utils/time_utils.py +31 -0
- aiq/plugins/.namespace +1 -0
- aiq/profiler/__init__.py +0 -0
- aiq/profiler/calc/__init__.py +14 -0
- aiq/profiler/calc/calc_runner.py +627 -0
- aiq/profiler/calc/calculations.py +288 -0
- aiq/profiler/calc/data_models.py +188 -0
- aiq/profiler/calc/plot.py +345 -0
- aiq/profiler/callbacks/__init__.py +0 -0
- aiq/profiler/callbacks/agno_callback_handler.py +295 -0
- aiq/profiler/callbacks/base_callback_class.py +20 -0
- aiq/profiler/callbacks/langchain_callback_handler.py +290 -0
- aiq/profiler/callbacks/llama_index_callback_handler.py +205 -0
- aiq/profiler/callbacks/semantic_kernel_callback_handler.py +238 -0
- aiq/profiler/callbacks/token_usage_base_model.py +27 -0
- aiq/profiler/data_frame_row.py +51 -0
- aiq/profiler/data_models.py +24 -0
- aiq/profiler/decorators/__init__.py +0 -0
- aiq/profiler/decorators/framework_wrapper.py +131 -0
- aiq/profiler/decorators/function_tracking.py +254 -0
- aiq/profiler/forecasting/__init__.py +0 -0
- aiq/profiler/forecasting/config.py +18 -0
- aiq/profiler/forecasting/model_trainer.py +75 -0
- aiq/profiler/forecasting/models/__init__.py +22 -0
- aiq/profiler/forecasting/models/forecasting_base_model.py +40 -0
- aiq/profiler/forecasting/models/linear_model.py +196 -0
- aiq/profiler/forecasting/models/random_forest_regressor.py +268 -0
- aiq/profiler/inference_metrics_model.py +28 -0
- aiq/profiler/inference_optimization/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +460 -0
- aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +258 -0
- aiq/profiler/inference_optimization/data_models.py +386 -0
- aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
- aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +468 -0
- aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +405 -0
- aiq/profiler/inference_optimization/llm_metrics.py +212 -0
- aiq/profiler/inference_optimization/prompt_caching.py +163 -0
- aiq/profiler/inference_optimization/token_uniqueness.py +107 -0
- aiq/profiler/inference_optimization/workflow_runtimes.py +72 -0
- aiq/profiler/intermediate_property_adapter.py +102 -0
- aiq/profiler/profile_runner.py +473 -0
- aiq/profiler/utils.py +184 -0
- aiq/registry_handlers/__init__.py +0 -0
- aiq/registry_handlers/local/__init__.py +0 -0
- aiq/registry_handlers/local/local_handler.py +176 -0
- aiq/registry_handlers/local/register_local.py +37 -0
- aiq/registry_handlers/metadata_factory.py +60 -0
- aiq/registry_handlers/package_utils.py +567 -0
- aiq/registry_handlers/pypi/__init__.py +0 -0
- aiq/registry_handlers/pypi/pypi_handler.py +251 -0
- aiq/registry_handlers/pypi/register_pypi.py +40 -0
- aiq/registry_handlers/register.py +21 -0
- aiq/registry_handlers/registry_handler_base.py +157 -0
- aiq/registry_handlers/rest/__init__.py +0 -0
- aiq/registry_handlers/rest/register_rest.py +56 -0
- aiq/registry_handlers/rest/rest_handler.py +237 -0
- aiq/registry_handlers/schemas/__init__.py +0 -0
- aiq/registry_handlers/schemas/headers.py +42 -0
- aiq/registry_handlers/schemas/package.py +68 -0
- aiq/registry_handlers/schemas/publish.py +63 -0
- aiq/registry_handlers/schemas/pull.py +82 -0
- aiq/registry_handlers/schemas/remove.py +36 -0
- aiq/registry_handlers/schemas/search.py +91 -0
- aiq/registry_handlers/schemas/status.py +47 -0
- aiq/retriever/__init__.py +0 -0
- aiq/retriever/interface.py +37 -0
- aiq/retriever/milvus/__init__.py +14 -0
- aiq/retriever/milvus/register.py +81 -0
- aiq/retriever/milvus/retriever.py +228 -0
- aiq/retriever/models.py +74 -0
- aiq/retriever/nemo_retriever/__init__.py +14 -0
- aiq/retriever/nemo_retriever/register.py +60 -0
- aiq/retriever/nemo_retriever/retriever.py +190 -0
- aiq/retriever/register.py +22 -0
- aiq/runtime/__init__.py +14 -0
- aiq/runtime/loader.py +215 -0
- aiq/runtime/runner.py +190 -0
- aiq/runtime/session.py +158 -0
- aiq/runtime/user_metadata.py +130 -0
- aiq/settings/__init__.py +0 -0
- aiq/settings/global_settings.py +318 -0
- aiq/test/.namespace +1 -0
- aiq/tool/__init__.py +0 -0
- aiq/tool/chat_completion.py +74 -0
- aiq/tool/code_execution/README.md +151 -0
- aiq/tool/code_execution/__init__.py +0 -0
- aiq/tool/code_execution/code_sandbox.py +267 -0
- aiq/tool/code_execution/local_sandbox/.gitignore +1 -0
- aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +60 -0
- aiq/tool/code_execution/local_sandbox/__init__.py +13 -0
- aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +198 -0
- aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +6 -0
- aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +50 -0
- aiq/tool/code_execution/register.py +74 -0
- aiq/tool/code_execution/test_code_execution_sandbox.py +414 -0
- aiq/tool/code_execution/utils.py +100 -0
- aiq/tool/datetime_tools.py +42 -0
- aiq/tool/document_search.py +141 -0
- aiq/tool/github_tools/__init__.py +0 -0
- aiq/tool/github_tools/create_github_commit.py +133 -0
- aiq/tool/github_tools/create_github_issue.py +87 -0
- aiq/tool/github_tools/create_github_pr.py +106 -0
- aiq/tool/github_tools/get_github_file.py +106 -0
- aiq/tool/github_tools/get_github_issue.py +166 -0
- aiq/tool/github_tools/get_github_pr.py +256 -0
- aiq/tool/github_tools/update_github_issue.py +100 -0
- aiq/tool/mcp/__init__.py +14 -0
- aiq/tool/mcp/exceptions.py +142 -0
- aiq/tool/mcp/mcp_client.py +255 -0
- aiq/tool/mcp/mcp_tool.py +96 -0
- aiq/tool/memory_tools/__init__.py +0 -0
- aiq/tool/memory_tools/add_memory_tool.py +79 -0
- aiq/tool/memory_tools/delete_memory_tool.py +67 -0
- aiq/tool/memory_tools/get_memory_tool.py +72 -0
- aiq/tool/nvidia_rag.py +95 -0
- aiq/tool/register.py +38 -0
- aiq/tool/retriever.py +89 -0
- aiq/tool/server_tools.py +66 -0
- aiq/utils/__init__.py +0 -0
- aiq/utils/data_models/__init__.py +0 -0
- aiq/utils/data_models/schema_validator.py +58 -0
- aiq/utils/debugging_utils.py +43 -0
- aiq/utils/dump_distro_mapping.py +32 -0
- aiq/utils/exception_handlers/__init__.py +0 -0
- aiq/utils/exception_handlers/automatic_retries.py +289 -0
- aiq/utils/exception_handlers/mcp.py +211 -0
- aiq/utils/exception_handlers/schemas.py +114 -0
- aiq/utils/io/__init__.py +0 -0
- aiq/utils/io/model_processing.py +28 -0
- aiq/utils/io/yaml_tools.py +119 -0
- aiq/utils/log_utils.py +37 -0
- aiq/utils/metadata_utils.py +74 -0
- aiq/utils/optional_imports.py +142 -0
- aiq/utils/producer_consumer_queue.py +178 -0
- aiq/utils/reactive/__init__.py +0 -0
- aiq/utils/reactive/base/__init__.py +0 -0
- aiq/utils/reactive/base/observable_base.py +65 -0
- aiq/utils/reactive/base/observer_base.py +55 -0
- aiq/utils/reactive/base/subject_base.py +79 -0
- aiq/utils/reactive/observable.py +59 -0
- aiq/utils/reactive/observer.py +76 -0
- aiq/utils/reactive/subject.py +131 -0
- aiq/utils/reactive/subscription.py +49 -0
- aiq/utils/settings/__init__.py +0 -0
- aiq/utils/settings/global_settings.py +197 -0
- aiq/utils/string_utils.py +38 -0
- aiq/utils/type_converter.py +290 -0
- aiq/utils/type_utils.py +484 -0
- aiq/utils/url_utils.py +27 -0
- nvidia_nat-1.2.0rc5.dist-info/METADATA +363 -0
- nvidia_nat-1.2.0rc5.dist-info/RECORD +435 -0
- nvidia_nat-1.2.0rc5.dist-info/WHEEL +5 -0
- nvidia_nat-1.2.0rc5.dist-info/entry_points.txt +20 -0
- nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE-3rd-party.txt +3686 -0
- nvidia_nat-1.2.0rc5.dist-info/licenses/LICENSE.md +201 -0
- nvidia_nat-1.2.0rc5.dist-info/top_level.txt +1 -0
|
@@ -0,0 +1,694 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import abc
|
|
17
|
+
import datetime
|
|
18
|
+
import typing
|
|
19
|
+
import uuid
|
|
20
|
+
from abc import abstractmethod
|
|
21
|
+
from enum import Enum
|
|
22
|
+
|
|
23
|
+
from pydantic import BaseModel
|
|
24
|
+
from pydantic import ConfigDict
|
|
25
|
+
from pydantic import Discriminator
|
|
26
|
+
from pydantic import Field
|
|
27
|
+
from pydantic import HttpUrl
|
|
28
|
+
from pydantic import conlist
|
|
29
|
+
from pydantic import field_serializer
|
|
30
|
+
from pydantic import field_validator
|
|
31
|
+
from pydantic_core.core_schema import ValidationInfo
|
|
32
|
+
|
|
33
|
+
from aiq.data_models.interactive import HumanPrompt
|
|
34
|
+
from aiq.utils.type_converter import GlobalTypeConverter
|
|
35
|
+
|
|
36
|
+
|
|
37
|
+
class Request(BaseModel):
    """
    Request is a data model that represents HTTP request attributes.
    """
    # Attributes that are not declared below are rejected at validation time.
    model_config = ConfigDict(extra="forbid")

    # Every attribute is optional and falls back to None when not supplied.
    method: str | None = Field(
        default=None,
        description="HTTP method used for the request (e.g., GET, POST, PUT, DELETE).",
    )
    url_path: str | None = Field(
        default=None,
        description="URL request path.",
    )
    url_port: int | None = Field(
        default=None,
        description="URL request port number.",
    )
    url_scheme: str | None = Field(
        default=None,
        description="URL scheme indicating the protocol (e.g., http, https).",
    )
    # Headers and query parameters are deliberately untyped (typing.Any).
    headers: typing.Any | None = Field(
        default=None,
        description="HTTP headers associated with the request.",
    )
    query_params: typing.Any | None = Field(
        default=None,
        description="Query parameters included in the request URL.",
    )
    path_params: dict[str, str] | None = Field(
        default=None,
        description="Path parameters extracted from the request URL.",
    )
    client_host: str | None = Field(
        default=None,
        description="Client host address from which the request originated.",
    )
    client_port: int | None = Field(
        default=None,
        description="Client port number from which the request originated.",
    )
    cookies: dict[str, str] | None = Field(
        default=None,
        description="Cookies sent with the request, stored in a dictionary-like object.",
    )
|
|
56
|
+
|
|
57
|
+
|
|
58
|
+
class ChatContentType(str, Enum):
    """
    ChatContentType is an Enum that represents the type of Chat content.
    """
    # Members are also ``str`` instances, so they compare equal to their raw values.

    # Plain text part.
    TEXT = "text"

    # Part that references an image by URL.
    IMAGE_URL = "image_url"

    # Part that carries audio input.
    INPUT_AUDIO = "input_audio"
|
|
65
|
+
|
|
66
|
+
|
|
67
|
+
class InputAudio(BaseModel):
    # Payload of an audio content part. Both fields are plain strings that
    # fall back to the placeholder value "default" when omitted.

    # Audio payload as a string.
    data: str = "default"

    # Name of the audio format as a string.
    format: str = "default"
|
|
70
|
+
|
|
71
|
+
|
|
72
|
+
class AudioContent(BaseModel):
    # Audio part of a user message; undeclared keys are rejected.
    model_config = ConfigDict(extra="forbid")

    # Tag fixed to ChatContentType.INPUT_AUDIO; no other value validates.
    type: typing.Literal[ChatContentType.INPUT_AUDIO] = ChatContentType.INPUT_AUDIO

    # Audio payload; defaults to an InputAudio built from its own defaults.
    input_audio: InputAudio = InputAudio()
|
|
77
|
+
|
|
78
|
+
|
|
79
|
+
class ImageUrl(BaseModel):
    # Wrapper around the URL of an image content part.

    # Validated as an HTTP(S) URL; a placeholder address is used when omitted.
    url: HttpUrl = HttpUrl(url="http://default.com")
|
|
81
|
+
|
|
82
|
+
|
|
83
|
+
class ImageContent(BaseModel):
    # Image part of a user message; undeclared keys are rejected.
    model_config = ConfigDict(extra="forbid")

    # Tag fixed to ChatContentType.IMAGE_URL; no other value validates.
    type: typing.Literal[ChatContentType.IMAGE_URL] = ChatContentType.IMAGE_URL

    # Image reference; defaults to an ImageUrl built from its own defaults.
    image_url: ImageUrl = ImageUrl()
|
|
88
|
+
|
|
89
|
+
|
|
90
|
+
class TextContent(BaseModel):
    # Text part of a user message; undeclared keys are rejected.
    model_config = ConfigDict(extra="forbid")

    # Tag fixed to ChatContentType.TEXT; no other value validates.
    type: typing.Literal[ChatContentType.TEXT] = ChatContentType.TEXT

    # The text itself; the placeholder "default" is used when omitted.
    text: str = "default"
|
|
95
|
+
|
|
96
|
+
|
|
97
|
+
class Security(BaseModel):
    # Holder for credential strings; undeclared keys are rejected.
    model_config = ConfigDict(extra="forbid")

    # Both values are plain strings with the placeholder default "default".
    api_key: str = "default"
    token: str = "default"
|
|
102
|
+
|
|
103
|
+
|
|
104
|
+
# Union of the text, image and audio content parts, discriminated on each part's "type" field.
UserContent = typing.Annotated[TextContent | ImageContent | AudioContent, Discriminator("type")]
|
|
105
|
+
|
|
106
|
+
|
|
107
|
+
class Message(BaseModel):
    # One chat message. Both fields are required.

    # Either a plain string or a list of typed content parts (UserContent).
    content: str | list[UserContent]

    # Free-form role string; the factories in this file use "user".
    role: str
|
|
110
|
+
|
|
111
|
+
|
|
112
|
+
class AIQChatRequest(BaseModel):
    """
    AIQChatRequest is a data model that represents a request to the AIQ Toolkit chat API.
    Fully compatible with OpenAI Chat Completions API specification.
    """

    # Required fields
    # The length constraint is attached through Field metadata. The result of
    # ``conlist(...)`` is itself an annotated type, and pydantic does not treat it as
    # a constraint when it is passed as Annotated metadata, so the previous spelling
    # accepted an empty list.
    messages: typing.Annotated[list[Message], Field(min_length=1)]

    # Optional fields (OpenAI Chat Completions API compatible)
    model: str | None = Field(default=None, description="name of the model to use")
    frequency_penalty: float | None = Field(default=0.0,
                                            description="Penalty for new tokens based on frequency in text")
    logit_bias: dict[str, float] | None = Field(default=None,
                                                description="Modify likelihood of specified tokens appearing")
    logprobs: bool | None = Field(default=None, description="Whether to return log probabilities")
    top_logprobs: int | None = Field(default=None, description="Number of most likely tokens to return")
    max_tokens: int | None = Field(default=None, description="Maximum number of tokens to generate")
    n: int | None = Field(default=1, description="Number of chat completion choices to generate")
    presence_penalty: float | None = Field(default=0.0, description="Penalty for new tokens based on presence in text")
    response_format: dict[str, typing.Any] | None = Field(default=None, description="Response format specification")
    seed: int | None = Field(default=None, description="Random seed for deterministic sampling")
    service_tier: typing.Literal["auto", "default"] | None = Field(default=None,
                                                                   description="Service tier for the request")
    stream: bool | None = Field(default=False, description="Whether to stream partial message deltas")
    stream_options: dict[str, typing.Any] | None = Field(default=None, description="Options for streaming")
    temperature: float | None = Field(default=1.0, description="Sampling temperature between 0 and 2")
    top_p: float | None = Field(default=None, description="Nucleus sampling parameter")
    tools: list[dict[str, typing.Any]] | None = Field(default=None, description="List of tools the model may call")
    tool_choice: str | dict[str, typing.Any] | None = Field(default=None, description="Controls which tool is called")
    parallel_tool_calls: bool | None = Field(default=True, description="Whether to enable parallel function calling")
    user: str | None = Field(default=None, description="Unique identifier representing end-user")

    # Undeclared keys are accepted and kept (extra="allow"); the example below is
    # attached to the generated JSON schema.
    model_config = ConfigDict(extra="allow",
                              json_schema_extra={
                                  "example": {
                                      "model": "nvidia/nemotron",
                                      "messages": [{
                                          "role": "user", "content": "who are you?"
                                      }],
                                      "temperature": 0.7,
                                      "stream": False
                                  }
                              })

    @staticmethod
    def from_string(data: str,
                    *,
                    model: str | None = None,
                    temperature: float | None = None,
                    max_tokens: int | None = None,
                    top_p: float | None = None) -> "AIQChatRequest":
        """
        Build a request holding a single ``user`` message whose content is ``data``.

        The keyword arguments are forwarded to the model exactly as given. A value left at
        ``None`` is therefore passed explicitly and takes the place of the field default
        (for example, ``temperature`` becomes ``None`` rather than ``1.0``).
        """

        return AIQChatRequest(messages=[Message(content=data, role="user")],
                              model=model,
                              temperature=temperature,
                              max_tokens=max_tokens,
                              top_p=top_p)

    @staticmethod
    def from_content(content: list[UserContent],
                     *,
                     model: str | None = None,
                     temperature: float | None = None,
                     max_tokens: int | None = None,
                     top_p: float | None = None) -> "AIQChatRequest":
        """
        Build a request holding a single ``user`` message whose content is the given list of parts.

        The keyword arguments are forwarded to the model exactly as given. A value left at
        ``None`` is therefore passed explicitly and takes the place of the field default
        (for example, ``temperature`` becomes ``None`` rather than ``1.0``).
        """

        return AIQChatRequest(messages=[Message(content=content, role="user")],
                              model=model,
                              temperature=temperature,
                              max_tokens=max_tokens,
                              top_p=top_p)
|
|
184
|
+
|
|
185
|
+
|
|
186
|
+
class AIQChoiceMessage(BaseModel):
    # Message carried by a choice. Both fields are optional and default to None.

    # Message text.
    content: str | None = None

    # Role string of the message author.
    role: str | None = None
|
|
189
|
+
|
|
190
|
+
|
|
191
|
+
class AIQChoiceDelta(BaseModel):
    """Delta object for streaming responses (OpenAI-compatible)"""
    # Both fields are optional and default to None.

    # Text carried by this delta.
    content: str | None = None

    # Role string carried by this delta.
    role: str | None = None
|
|
195
|
+
|
|
196
|
+
|
|
197
|
+
class AIQChoice(BaseModel):
    # One entry of a response's ``choices`` list; undeclared keys are accepted and kept.
    model_config = ConfigDict(extra="allow")

    # Both payload fields are optional: ``message`` holds an AIQChoiceMessage and
    # ``delta`` holds an AIQChoiceDelta.
    message: AIQChoiceMessage | None = None
    delta: AIQChoiceDelta | None = None

    # Restricted to the listed literal values, or None.
    finish_reason: typing.Literal["stop", "length", "tool_calls", "content_filter", "function_call"] | None = None

    # Required integer index of this choice.
    index: int

    # Log-probability support is currently disabled:
    # logprobs: AIQChoiceLogprobs | None = None
|
|
205
|
+
|
|
206
|
+
|
|
207
|
+
class AIQUsage(BaseModel):
    # Token accounting attached to a response. All three counters are required integers.

    prompt_tokens: int
    completion_tokens: int
    total_tokens: int
|
|
211
|
+
|
|
212
|
+
|
|
213
|
+
class AIQResponseSerializable(abc.ABC):
    """
    AIQResponseSerializable is an abstract class that defines the interface for serializing output for the AIQ
    Toolkit chat streaming API.
    """

    @abc.abstractmethod
    def get_stream_data(self) -> str:
        """Return this object as a string for the streaming API. Concrete subclasses must override this."""
|
|
222
|
+
|
|
223
|
+
|
|
224
|
+
class AIQResponseBaseModelOutput(BaseModel, AIQResponseSerializable):
    # Base for pydantic response models that are streamed as ``data:`` records.

    def get_stream_data(self) -> str:
        """Return the model's JSON dump prefixed with ``data: `` and followed by a blank line."""
        payload = self.model_dump_json()
        return "data: " + payload + "\n\n"
|
|
228
|
+
|
|
229
|
+
|
|
230
|
+
class AIQResponseBaseModelIntermediate(BaseModel, AIQResponseSerializable):
    # Base for intermediate-step models that stream themselves as an `intermediate_data:` record.

    def get_stream_data(self) -> str:
        # The model's JSON dump, prefixed with "intermediate_data: " and terminated by a blank line.
        serialized = self.model_dump_json()
        return f"intermediate_data: {serialized}\n\n"
|
|
234
|
+
|
|
235
|
+
|
|
236
|
+
class AIQChatResponse(AIQResponseBaseModelOutput):
    """
    AIQChatResponse is a data model that represents a response from the AIQ Toolkit chat API.
    Fully compatible with OpenAI Chat Completions API specification.
    """

    # Allow extra fields in the model_config to support derived models
    model_config = ConfigDict(extra="allow")
    id: str
    object: str = "chat.completion"
    model: str = ""
    created: datetime.datetime
    choices: list[AIQChoice]
    usage: AIQUsage | None = None
    system_fingerprint: str | None = None
    service_tier: typing.Literal["scale", "default"] | None = None

    @field_serializer('created')
    def serialize_created(self, created: datetime.datetime) -> int:
        """Serialize datetime to Unix timestamp for OpenAI compatibility"""
        # Fractional seconds are truncated by int().
        epoch_seconds = created.timestamp()
        return int(epoch_seconds)

    @staticmethod
    def from_string(data: str,
                    *,
                    id_: str | None = None,
                    object_: str | None = None,
                    model: str | None = None,
                    created: datetime.datetime | None = None,
                    usage: AIQUsage | None = None) -> "AIQChatResponse":
        """
        Wrap plain text in a single-choice response.

        Any keyword left as None is defaulted: `id_` to a fresh UUID4 string, `object_` to
        "chat.completion", `model` to "" and `created` to the current UTC time. The one choice
        has index 0, carries `data` as its message content and finishes with "stop".
        """
        only_choice = AIQChoice(index=0, message=AIQChoiceMessage(content=data), finish_reason="stop")

        return AIQChatResponse(
            id=str(uuid.uuid4()) if id_ is None else id_,
            object="chat.completion" if object_ is None else object_,
            model="" if model is None else model,
            created=datetime.datetime.now(datetime.timezone.utc) if created is None else created,
            choices=[only_choice],
            usage=usage)
|
|
283
|
+
|
|
284
|
+
|
|
285
|
+
class AIQChatResponseChunk(AIQResponseBaseModelOutput):
    """
    AIQChatResponseChunk is a data model that represents a response chunk from the AIQ Toolkit chat streaming API.
    Fully compatible with OpenAI Chat Completions API specification.
    """

    # Allow extra fields in the model_config to support derived models
    model_config = ConfigDict(extra="allow")

    id: str
    choices: list[AIQChoice]
    created: datetime.datetime
    model: str = ""
    object: str = "chat.completion.chunk"
    system_fingerprint: str | None = None
    service_tier: typing.Literal["scale", "default"] | None = None
    usage: AIQUsage | None = None

    @field_serializer('created')
    def serialize_created(self, created: datetime.datetime) -> int:
        """Serialize datetime to Unix timestamp for OpenAI compatibility"""
        # Fractional seconds are truncated by int().
        epoch_seconds = created.timestamp()
        return int(epoch_seconds)

    @staticmethod
    def from_string(data: str,
                    *,
                    id_: str | None = None,
                    created: datetime.datetime | None = None,
                    model: str | None = None,
                    object_: str | None = None) -> "AIQChatResponseChunk":
        """
        Wrap plain text in a single-choice chunk.

        The text is placed in the choice's `message` (not its `delta`) with finish_reason "stop".
        Keywords left as None are defaulted: `id_` to a fresh UUID4 string, `created` to the
        current UTC time, `model` to "" and `object_` to "chat.completion.chunk".
        """
        only_choice = AIQChoice(index=0, message=AIQChoiceMessage(content=data), finish_reason="stop")

        return AIQChatResponseChunk(
            id=str(uuid.uuid4()) if id_ is None else id_,
            choices=[only_choice],
            created=datetime.datetime.now(datetime.timezone.utc) if created is None else created,
            model="" if model is None else model,
            object="chat.completion.chunk" if object_ is None else object_)

    @staticmethod
    def create_streaming_chunk(content: str,
                               *,
                               id_: str | None = None,
                               created: datetime.datetime | None = None,
                               model: str | None = None,
                               role: str | None = None,
                               finish_reason: str | None = None,
                               usage: AIQUsage | None = None,
                               system_fingerprint: str | None = None) -> "AIQChatResponseChunk":
        """Create an OpenAI-compatible streaming chunk"""
        chunk_id = str(uuid.uuid4()) if id_ is None else id_
        created_at = datetime.datetime.now(datetime.timezone.utc) if created is None else created
        model_name = "" if model is None else model

        # With neither content nor role, build the delta without passing any field explicitly.
        if content is None and role is None:
            delta = AIQChoiceDelta()
        else:
            delta = AIQChoiceDelta(content=content, role=role)

        streamed_choice = AIQChoice(index=0, message=None, delta=delta, finish_reason=finish_reason)

        return AIQChatResponseChunk(
            id=chunk_id,
            choices=[streamed_choice],
            created=created_at,
            model=model_name,
            object="chat.completion.chunk",
            usage=usage,
            system_fingerprint=system_fingerprint)
|
|
361
|
+
|
|
362
|
+
|
|
363
|
+
class AIQResponseIntermediateStep(AIQResponseBaseModelIntermediate):
    """
    AIQResponseIntermediateStep is a data model that represents a serialized step in the AIQ Toolkit chat streaming
    API.
    """

    # Allow extra fields in the model_config to support derived models
    model_config = ConfigDict(extra="allow")

    id: str
    parent_id: str | None = None
    # Defaults to "markdown" when not supplied.
    type: str = "markdown"
    name: str
    payload: str
|
|
376
|
+
|
|
377
|
+
|
|
378
|
+
class AIQResponsePayloadOutput(BaseModel, AIQResponseSerializable):
    # Streams an arbitrary payload as a `data:` record.

    payload: typing.Any

    def get_stream_data(self) -> str:
        # pydantic payloads are dumped as JSON; anything else goes through normal string
        # formatting (NOTE(review): a dict payload is therefore emitted as its Python
        # repr, not JSON — confirm this is what consumers expect).
        if isinstance(self.payload, BaseModel):
            rendered = self.payload.model_dump_json()
            return f"data: {rendered}\n\n"

        return f"data: {self.payload}\n\n"
|
|
388
|
+
|
|
389
|
+
|
|
390
|
+
class AIQGenerateResponse(BaseModel):
    # Allow extra fields in the model_config to support derived models
    model_config = ConfigDict(extra="allow")

    # (fixme) define the intermediate step model
    intermediate_steps: list[tuple] | None = None
    # Required output text.
    output: str
    value: str | None = "default"
|
|
398
|
+
|
|
399
|
+
|
|
400
|
+
class UserMessageContentRoleType(str, Enum):
    # Roles accepted for UserMessages.role; members are also plain strings.
    USER = "user"
    ASSISTANT = "assistant"
|
|
403
|
+
|
|
404
|
+
|
|
405
|
+
class WebSocketMessageType(str, Enum):
    """
    WebSocketMessageType is an Enum that represents WebSocket Message types.
    """
    # Note: the member names and their wire values differ for the two system_* response types.
    USER_MESSAGE = "user_message"
    RESPONSE_MESSAGE = "system_response_message"
    INTERMEDIATE_STEP_MESSAGE = "system_intermediate_message"
    SYSTEM_INTERACTION_MESSAGE = "system_interaction_message"
    USER_INTERACTION_MESSAGE = "user_interaction_message"
    ERROR_MESSAGE = "error_message"
|
|
415
|
+
|
|
416
|
+
|
|
417
|
+
class WorkflowSchemaType(str, Enum):
    """
    WorkflowSchemaType is an Enum that represents Workflow response types.
    """
    GENERATE_STREAM = "generate_stream"
    CHAT_STREAM = "chat_stream"
    GENERATE = "generate"
    CHAT = "chat"
|
|
425
|
+
|
|
426
|
+
|
|
427
|
+
class WebSocketMessageStatus(str, Enum):
    """
    WebSocketMessageStatus is an Enum that represents the status of a WebSocket message.
    """
    IN_PROGRESS = "in_progress"
    COMPLETE = "complete"
|
|
433
|
+
|
|
434
|
+
|
|
435
|
+
class UserMessages(BaseModel):
    # One message inside UserMessageContent.messages; unknown fields are rejected.
    model_config = ConfigDict(extra="forbid")

    role: UserMessageContentRoleType
    content: list[UserContent]
|
|
440
|
+
|
|
441
|
+
|
|
442
|
+
class UserMessageContent(BaseModel):
    # Container for a list of UserMessages; unknown fields are rejected.
    model_config = ConfigDict(extra="forbid")
    messages: list[UserMessages]
|
|
445
|
+
|
|
446
|
+
|
|
447
|
+
class User(BaseModel):
    # User details attached to WebSocket messages; unknown fields are rejected.
    model_config = ConfigDict(extra="forbid")

    # Both fields fall back to the placeholder string "default".
    name: str = "default"
    email: str = "default"
|
|
452
|
+
|
|
453
|
+
|
|
454
|
+
class ErrorTypes(str, Enum):
    # Error codes usable in Error.code; members are also plain strings.
    UNKNOWN_ERROR = "unknown_error"
    INVALID_MESSAGE = "invalid_message"
    INVALID_MESSAGE_TYPE = "invalid_message_type"
    INVALID_USER_MESSAGE_CONTENT = "invalid_user_message_content"
    INVALID_DATA_CONTENT = "invalid_data_content"
|
|
460
|
+
|
|
461
|
+
|
|
462
|
+
class Error(BaseModel):
    # Error payload for WebSocket messages; unknown fields are rejected.
    model_config = ConfigDict(extra="forbid")

    # Defaults describe an unspecified error with placeholder text.
    code: ErrorTypes = ErrorTypes.UNKNOWN_ERROR
    message: str = "default"
    details: str = "default"
|
|
468
|
+
|
|
469
|
+
|
|
470
|
+
from pydantic import Field  # used for default_factory below; redundant but harmless if already imported


class WebSocketUserMessage(BaseModel):
    """
    For more details, refer to the API documentation:
    docs/source/developer_guide/websockets.md
    """
    # Allow extra fields in the model_config to support derived models
    model_config = ConfigDict(extra="allow")

    # Only the USER_MESSAGE type is accepted for this model.
    type: typing.Literal[WebSocketMessageType.USER_MESSAGE]
    schema_type: WorkflowSchemaType
    id: str = "default"
    conversation_id: str | None = None
    content: UserMessageContent
    user: User = User()
    security: Security = Security()
    error: Error = Error()
    schema_version: str = "1.0.0"
    # Computed per instance. A plain `str(datetime.now(...))` default is evaluated once,
    # when the class is defined, so every message would share the import-time timestamp.
    timestamp: str = Field(default_factory=lambda: str(datetime.datetime.now(datetime.timezone.utc)))
|
|
488
|
+
|
|
489
|
+
|
|
490
|
+
from pydantic import Field  # used for default_factory below; redundant but harmless if already imported


class WebSocketUserInteractionResponseMessage(BaseModel):
    """
    For more details, refer to the API documentation:
    docs/source/developer_guide/websockets.md
    """
    # Only the USER_INTERACTION_MESSAGE type is accepted for this model.
    type: typing.Literal[WebSocketMessageType.USER_INTERACTION_MESSAGE]
    id: str = "default"
    thread_id: str = "default"
    content: UserMessageContent
    user: User = User()
    security: Security = Security()
    error: Error = Error()
    schema_version: str = "1.0.0"
    # Computed per instance. A plain `str(datetime.now(...))` default is evaluated once,
    # when the class is defined, so every message would share the import-time timestamp.
    timestamp: str = Field(default_factory=lambda: str(datetime.datetime.now(datetime.timezone.utc)))
|
|
504
|
+
|
|
505
|
+
|
|
506
|
+
class SystemIntermediateStepContent(BaseModel):
    # Content of an intermediate-step WebSocket message; unknown fields are rejected.
    model_config = ConfigDict(extra="forbid")
    name: str
    payload: str
|
|
510
|
+
|
|
511
|
+
|
|
512
|
+
from pydantic import Field  # used for default_factory below; redundant but harmless if already imported


class WebSocketSystemIntermediateStepMessage(BaseModel):
    """
    For more details, refer to the API documentation:
    docs/source/developer_guide/websockets.md
    """
    # Allow extra fields in the model_config to support derived models
    model_config = ConfigDict(extra="allow")

    # Only the INTERMEDIATE_STEP_MESSAGE type is accepted for this model.
    type: typing.Literal[WebSocketMessageType.INTERMEDIATE_STEP_MESSAGE]
    id: str = "default"
    thread_id: str | None = "default"
    parent_id: str = "default"
    intermediate_parent_id: str | None = "default"
    update_message_id: str | None = "default"
    content: SystemIntermediateStepContent
    status: WebSocketMessageStatus
    # Computed per instance. A plain `str(datetime.now(...))` default is evaluated once,
    # when the class is defined, so every message would share the import-time timestamp.
    timestamp: str = Field(default_factory=lambda: str(datetime.datetime.now(datetime.timezone.utc)))
|
|
529
|
+
|
|
530
|
+
|
|
531
|
+
class SystemResponseContent(BaseModel):
    # Text content of a system response message; unknown fields are rejected.
    model_config = ConfigDict(extra="forbid")

    text: str | None = None
|
|
535
|
+
|
|
536
|
+
|
|
537
|
+
from pydantic import Field  # used for default_factory below; redundant but harmless if already imported


class WebSocketSystemResponseTokenMessage(BaseModel):
    """
    For more details, refer to the API documentation:
    docs/source/developer_guide/websockets.md
    """
    # Allow extra fields in the model_config to support derived models
    model_config = ConfigDict(extra="allow")

    # Either a normal response or an error message; `content` is checked against this below.
    type: typing.Literal[WebSocketMessageType.RESPONSE_MESSAGE, WebSocketMessageType.ERROR_MESSAGE]
    id: str | None = "default"
    thread_id: str | None = "default"
    parent_id: str = "default"
    content: SystemResponseContent | Error | AIQGenerateResponse
    status: WebSocketMessageStatus
    # Computed per instance. A plain `str(datetime.now(...))` default is evaluated once,
    # when the class is defined, so every message would share the import-time timestamp.
    timestamp: str = Field(default_factory=lambda: str(datetime.datetime.now(datetime.timezone.utc)))

    @field_validator("content")
    @classmethod
    def validate_content_by_type(cls, value: SystemResponseContent | Error | AIQGenerateResponse, info: ValidationInfo):
        """
        Check that `content` matches the already-validated `type`.

        Error messages must carry an `Error`; response messages must carry a
        `SystemResponseContent` or an `AIQGenerateResponse`. Raises ValueError otherwise.
        If `type` is absent from `info.data`, no check applies and the value is returned as is.
        """
        message_type = info.data.get("type")

        if message_type == WebSocketMessageType.ERROR_MESSAGE and not isinstance(value, Error):
            raise ValueError(f"Field: content must be 'Error' when type is {WebSocketMessageType.ERROR_MESSAGE}")

        if message_type == WebSocketMessageType.RESPONSE_MESSAGE and not isinstance(
                value, (SystemResponseContent, AIQGenerateResponse)):
            # Message text kept as-is; note that AIQGenerateResponse is accepted too.
            raise ValueError(
                f"Field: content must be 'SystemResponseContent' when type is {WebSocketMessageType.RESPONSE_MESSAGE}")
        return value
|
|
564
|
+
|
|
565
|
+
|
|
566
|
+
from pydantic import Field  # used for default_factory below; redundant but harmless if already imported


class WebSocketSystemInteractionMessage(BaseModel):
    """
    For more details, refer to the API documentation:
    docs/source/developer_guide/websockets.md
    """
    # Allow extra fields in the model_config to support derived models
    model_config = ConfigDict(extra="allow")

    # Fixed to SYSTEM_INTERACTION_MESSAGE, which is also the default.
    type: typing.Literal[
        WebSocketMessageType.SYSTEM_INTERACTION_MESSAGE] = WebSocketMessageType.SYSTEM_INTERACTION_MESSAGE
    id: str | None = "default"
    thread_id: str | None = "default"
    parent_id: str = "default"
    content: HumanPrompt
    status: WebSocketMessageStatus
    # Computed per instance. A plain `str(datetime.now(...))` default is evaluated once,
    # when the class is defined, so every message would share the import-time timestamp.
    timestamp: str = Field(default_factory=lambda: str(datetime.datetime.now(datetime.timezone.utc)))
|
|
582
|
+
|
|
583
|
+
|
|
584
|
+
# ======== AIQGenerateResponse Converters ========
|
|
585
|
+
|
|
586
|
+
|
|
587
|
+
def _generate_response_to_str(response: AIQGenerateResponse) -> str:
    """Return the `output` text of a generate response."""
    output_text = response.output
    return output_text


GlobalTypeConverter.register_converter(_generate_response_to_str)
|
|
592
|
+
|
|
593
|
+
|
|
594
|
+
def _generate_response_to_chat_response(response: AIQGenerateResponse) -> AIQChatResponse:
    """Build a chat response from a generate response's `output` text, with simulated usage."""
    text = response.output

    # Simulate usage: zero prompt tokens, one completion token per whitespace-separated word.
    word_count = len(text.split())
    simulated_usage = AIQUsage(prompt_tokens=0, completion_tokens=word_count, total_tokens=0 + word_count)

    return AIQChatResponse.from_string(text, usage=simulated_usage)


GlobalTypeConverter.register_converter(_generate_response_to_chat_response)
|
|
608
|
+
|
|
609
|
+
|
|
610
|
+
# ======== AIQChatRequest Converters ========
|
|
611
|
+
def _aiq_chat_request_to_string(data: AIQChatRequest) -> str:
    """Return the content of the request's last message; non-string content goes through str()."""
    last_content = data.messages[-1].content
    return last_content if isinstance(last_content, str) else str(last_content)


GlobalTypeConverter.register_converter(_aiq_chat_request_to_string)
|
|
618
|
+
|
|
619
|
+
|
|
620
|
+
def _string_to_aiq_chat_request(data: str) -> AIQChatRequest:
    """Build a chat request from plain text via AIQChatRequest.from_string, with an empty model name."""
    request = AIQChatRequest.from_string(data, model="")
    return request


GlobalTypeConverter.register_converter(_string_to_aiq_chat_request)
|
|
625
|
+
|
|
626
|
+
|
|
627
|
+
# ======== AIQChatResponse Converters ========
|
|
628
|
+
def _aiq_chat_response_to_string(data: AIQChatResponse) -> str:
    """
    Return the message content of the response's first choice.

    Returns "" when there are no choices, when the first choice has no message
    (AIQChoice.message is optional), or when the message content is empty or None.
    """
    if not data.choices:
        return ""

    first_message = data.choices[0].message
    if first_message is None:
        return ""

    return first_message.content or ""


GlobalTypeConverter.register_converter(_aiq_chat_response_to_string)
|
|
633
|
+
|
|
634
|
+
|
|
635
|
+
def _string_to_aiq_chat_response(data: str) -> AIQChatResponse:
    '''Converts a string to an AIQChatResponse object'''

    # Simulate usage: zero prompt tokens, one completion token per whitespace-separated word.
    word_count = len(data.split())
    simulated_usage = AIQUsage(prompt_tokens=0, completion_tokens=word_count, total_tokens=0 + word_count)

    return AIQChatResponse.from_string(data, usage=simulated_usage)


GlobalTypeConverter.register_converter(_string_to_aiq_chat_response)
|
|
649
|
+
|
|
650
|
+
|
|
651
|
+
def _chat_response_to_chat_response_chunk(data: AIQChatResponse) -> AIQChatResponseChunk:
    """Copy id, choices, created and model from a full response into a chunk."""
    # Preserve original message structure for backward compatibility
    chunk = AIQChatResponseChunk(id=data.id, choices=data.choices, created=data.created, model=data.model)
    return chunk


GlobalTypeConverter.register_converter(_chat_response_to_chat_response_chunk)
|
|
657
|
+
|
|
658
|
+
|
|
659
|
+
# ======== AIQChatResponseChunk Converters ========
|
|
660
|
+
def _aiq_chat_response_chunk_to_string(data: AIQChatResponseChunk) -> str:
    """
    Return the text of the chunk's first choice.

    Non-empty delta content wins over non-empty message content; "" is returned when
    there are no choices or neither holds text.
    """
    if not data.choices:
        return ""

    first = data.choices[0]
    for part in (first.delta, first.message):
        if part and part.content:
            return part.content
    return ""


GlobalTypeConverter.register_converter(_aiq_chat_response_chunk_to_string)
|
|
671
|
+
|
|
672
|
+
|
|
673
|
+
def _string_to_aiq_chat_response_chunk(data: str) -> AIQChatResponseChunk:
    '''Converts a string to an AIQChatResponseChunk object'''

    # Delegates to AIQChatResponseChunk.from_string with all of its defaults.
    chunk = AIQChatResponseChunk.from_string(data)
    return chunk


GlobalTypeConverter.register_converter(_string_to_aiq_chat_response_chunk)
|
|
681
|
+
|
|
682
|
+
|
|
683
|
+
# ======== AINodeMessageChunk Converters ========
|
|
684
|
+
def _ai_message_chunk_to_aiq_chat_response_chunk(data) -> AIQChatResponseChunk:
    '''Converts LangChain AINodeMessageChunk to AIQChatResponseChunk'''
    # Use the first of `content`, `text`, `message` that exists and is not None,
    # stringified; fall back to "" when none qualifies.
    content = ""
    for attr_name in ('content', 'text', 'message'):
        candidate = getattr(data, attr_name, None)
        if candidate is not None:
            content = str(candidate)
            break

    return AIQChatResponseChunk.create_streaming_chunk(content=content, role="assistant", finish_reason=None)
|