PyPI - aiqtoolkit - Versions diffs - 1.2.0rc4__py3-none-any.whl → 1.2rc9__py3-none-any.whl - Mend

aiqtoolkit 1.2.0rc4__py3-none-any.whl → 1.2rc9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of aiqtoolkit might be problematic. Click here for more details.

Files changed (441) hide show

aiqtoolkit-1.2rc9.dist-info/METADATA +29 -0
aiqtoolkit-1.2rc9.dist-info/RECORD +4 -0
aiqtoolkit-1.2rc9.dist-info/top_level.txt +1 -0
aiq/agent/__init__.py +0 -0
aiq/agent/base.py +0 -239
aiq/agent/dual_node.py +0 -67
aiq/agent/react_agent/__init__.py +0 -0
aiq/agent/react_agent/agent.py +0 -355
aiq/agent/react_agent/output_parser.py +0 -104
aiq/agent/react_agent/prompt.py +0 -41
aiq/agent/react_agent/register.py +0 -149
aiq/agent/reasoning_agent/__init__.py +0 -0
aiq/agent/reasoning_agent/reasoning_agent.py +0 -225
aiq/agent/register.py +0 -23
aiq/agent/rewoo_agent/__init__.py +0 -0
aiq/agent/rewoo_agent/agent.py +0 -411
aiq/agent/rewoo_agent/prompt.py +0 -108
aiq/agent/rewoo_agent/register.py +0 -158
aiq/agent/tool_calling_agent/__init__.py +0 -0
aiq/agent/tool_calling_agent/agent.py +0 -119
aiq/agent/tool_calling_agent/register.py +0 -106
aiq/authentication/__init__.py +0 -14
aiq/authentication/api_key/__init__.py +0 -14
aiq/authentication/api_key/api_key_auth_provider.py +0 -96
aiq/authentication/api_key/api_key_auth_provider_config.py +0 -124
aiq/authentication/api_key/register.py +0 -26
aiq/authentication/exceptions/__init__.py +0 -14
aiq/authentication/exceptions/api_key_exceptions.py +0 -38
aiq/authentication/exceptions/auth_code_grant_exceptions.py +0 -86
aiq/authentication/exceptions/call_back_exceptions.py +0 -38
aiq/authentication/exceptions/request_exceptions.py +0 -54
aiq/authentication/http_basic_auth/__init__.py +0 -0
aiq/authentication/http_basic_auth/http_basic_auth_provider.py +0 -81
aiq/authentication/http_basic_auth/register.py +0 -30
aiq/authentication/interfaces.py +0 -93
aiq/authentication/oauth2/__init__.py +0 -14
aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +0 -107
aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +0 -39
aiq/authentication/oauth2/register.py +0 -25
aiq/authentication/register.py +0 -21
aiq/builder/__init__.py +0 -0
aiq/builder/builder.py +0 -285
aiq/builder/component_utils.py +0 -316
aiq/builder/context.py +0 -264
aiq/builder/embedder.py +0 -24
aiq/builder/eval_builder.py +0 -161
aiq/builder/evaluator.py +0 -29
aiq/builder/framework_enum.py +0 -24
aiq/builder/front_end.py +0 -73
aiq/builder/function.py +0 -344
aiq/builder/function_base.py +0 -380
aiq/builder/function_info.py +0 -627
aiq/builder/intermediate_step_manager.py +0 -174
aiq/builder/llm.py +0 -25
aiq/builder/retriever.py +0 -25
aiq/builder/user_interaction_manager.py +0 -74
aiq/builder/workflow.py +0 -148
aiq/builder/workflow_builder.py +0 -1117
aiq/cli/__init__.py +0 -14
aiq/cli/cli_utils/__init__.py +0 -0
aiq/cli/cli_utils/config_override.py +0 -231
aiq/cli/cli_utils/validation.py +0 -37
aiq/cli/commands/__init__.py +0 -0
aiq/cli/commands/configure/__init__.py +0 -0
aiq/cli/commands/configure/channel/__init__.py +0 -0
aiq/cli/commands/configure/channel/add.py +0 -28
aiq/cli/commands/configure/channel/channel.py +0 -36
aiq/cli/commands/configure/channel/remove.py +0 -30
aiq/cli/commands/configure/channel/update.py +0 -30
aiq/cli/commands/configure/configure.py +0 -33
aiq/cli/commands/evaluate.py +0 -139
aiq/cli/commands/info/__init__.py +0 -14
aiq/cli/commands/info/info.py +0 -39
aiq/cli/commands/info/list_channels.py +0 -32
aiq/cli/commands/info/list_components.py +0 -129
aiq/cli/commands/info/list_mcp.py +0 -213
aiq/cli/commands/registry/__init__.py +0 -14
aiq/cli/commands/registry/publish.py +0 -88
aiq/cli/commands/registry/pull.py +0 -118
aiq/cli/commands/registry/registry.py +0 -38
aiq/cli/commands/registry/remove.py +0 -108
aiq/cli/commands/registry/search.py +0 -155
aiq/cli/commands/sizing/__init__.py +0 -14
aiq/cli/commands/sizing/calc.py +0 -297
aiq/cli/commands/sizing/sizing.py +0 -27
aiq/cli/commands/start.py +0 -246
aiq/cli/commands/uninstall.py +0 -81
aiq/cli/commands/validate.py +0 -47
aiq/cli/commands/workflow/__init__.py +0 -14
aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
aiq/cli/commands/workflow/templates/config.yml.j2 +0 -16
aiq/cli/commands/workflow/templates/pyproject.toml.j2 +0 -22
aiq/cli/commands/workflow/templates/register.py.j2 +0 -5
aiq/cli/commands/workflow/templates/workflow.py.j2 +0 -36
aiq/cli/commands/workflow/workflow.py +0 -37
aiq/cli/commands/workflow/workflow_commands.py +0 -313
aiq/cli/entrypoint.py +0 -135
aiq/cli/main.py +0 -44
aiq/cli/register_workflow.py +0 -488
aiq/cli/type_registry.py +0 -1000
aiq/data_models/__init__.py +0 -14
aiq/data_models/api_server.py +0 -694
aiq/data_models/authentication.py +0 -231
aiq/data_models/common.py +0 -171
aiq/data_models/component.py +0 -54
aiq/data_models/component_ref.py +0 -168
aiq/data_models/config.py +0 -406
aiq/data_models/dataset_handler.py +0 -123
aiq/data_models/discovery_metadata.py +0 -335
aiq/data_models/embedder.py +0 -27
aiq/data_models/evaluate.py +0 -127
aiq/data_models/evaluator.py +0 -26
aiq/data_models/front_end.py +0 -26
aiq/data_models/function.py +0 -30
aiq/data_models/function_dependencies.py +0 -72
aiq/data_models/interactive.py +0 -246
aiq/data_models/intermediate_step.py +0 -302
aiq/data_models/invocation_node.py +0 -38
aiq/data_models/its_strategy.py +0 -30
aiq/data_models/llm.py +0 -27
aiq/data_models/logging.py +0 -26
aiq/data_models/memory.py +0 -27
aiq/data_models/object_store.py +0 -44
aiq/data_models/profiler.py +0 -54
aiq/data_models/registry_handler.py +0 -26
aiq/data_models/retriever.py +0 -30
aiq/data_models/retry_mixin.py +0 -35
aiq/data_models/span.py +0 -187
aiq/data_models/step_adaptor.py +0 -64
aiq/data_models/streaming.py +0 -33
aiq/data_models/swe_bench_model.py +0 -54
aiq/data_models/telemetry_exporter.py +0 -26
aiq/embedder/__init__.py +0 -0
aiq/embedder/langchain_client.py +0 -41
aiq/embedder/nim_embedder.py +0 -59
aiq/embedder/openai_embedder.py +0 -43
aiq/embedder/register.py +0 -24
aiq/eval/__init__.py +0 -14
aiq/eval/config.py +0 -60
aiq/eval/dataset_handler/__init__.py +0 -0
aiq/eval/dataset_handler/dataset_downloader.py +0 -106
aiq/eval/dataset_handler/dataset_filter.py +0 -52
aiq/eval/dataset_handler/dataset_handler.py +0 -254
aiq/eval/evaluate.py +0 -506
aiq/eval/evaluator/__init__.py +0 -14
aiq/eval/evaluator/base_evaluator.py +0 -73
aiq/eval/evaluator/evaluator_model.py +0 -45
aiq/eval/intermediate_step_adapter.py +0 -99
aiq/eval/rag_evaluator/__init__.py +0 -0
aiq/eval/rag_evaluator/evaluate.py +0 -178
aiq/eval/rag_evaluator/register.py +0 -143
aiq/eval/register.py +0 -23
aiq/eval/remote_workflow.py +0 -133
aiq/eval/runners/__init__.py +0 -14
aiq/eval/runners/config.py +0 -39
aiq/eval/runners/multi_eval_runner.py +0 -54
aiq/eval/runtime_event_subscriber.py +0 -52
aiq/eval/swe_bench_evaluator/__init__.py +0 -0
aiq/eval/swe_bench_evaluator/evaluate.py +0 -215
aiq/eval/swe_bench_evaluator/register.py +0 -36
aiq/eval/trajectory_evaluator/__init__.py +0 -0
aiq/eval/trajectory_evaluator/evaluate.py +0 -75
aiq/eval/trajectory_evaluator/register.py +0 -40
aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
aiq/eval/tunable_rag_evaluator/evaluate.py +0 -245
aiq/eval/tunable_rag_evaluator/register.py +0 -52
aiq/eval/usage_stats.py +0 -41
aiq/eval/utils/__init__.py +0 -0
aiq/eval/utils/output_uploader.py +0 -140
aiq/eval/utils/tqdm_position_registry.py +0 -40
aiq/eval/utils/weave_eval.py +0 -184
aiq/experimental/__init__.py +0 -0
aiq/experimental/decorators/__init__.py +0 -0
aiq/experimental/decorators/experimental_warning_decorator.py +0 -130
aiq/experimental/inference_time_scaling/__init__.py +0 -0
aiq/experimental/inference_time_scaling/editing/__init__.py +0 -0
aiq/experimental/inference_time_scaling/editing/iterative_plan_refinement_editor.py +0 -147
aiq/experimental/inference_time_scaling/editing/llm_as_a_judge_editor.py +0 -204
aiq/experimental/inference_time_scaling/editing/motivation_aware_summarization.py +0 -107
aiq/experimental/inference_time_scaling/functions/__init__.py +0 -0
aiq/experimental/inference_time_scaling/functions/execute_score_select_function.py +0 -105
aiq/experimental/inference_time_scaling/functions/its_tool_orchestration_function.py +0 -205
aiq/experimental/inference_time_scaling/functions/its_tool_wrapper_function.py +0 -146
aiq/experimental/inference_time_scaling/functions/plan_select_execute_function.py +0 -224
aiq/experimental/inference_time_scaling/models/__init__.py +0 -0
aiq/experimental/inference_time_scaling/models/editor_config.py +0 -132
aiq/experimental/inference_time_scaling/models/its_item.py +0 -48
aiq/experimental/inference_time_scaling/models/scoring_config.py +0 -112
aiq/experimental/inference_time_scaling/models/search_config.py +0 -120
aiq/experimental/inference_time_scaling/models/selection_config.py +0 -154
aiq/experimental/inference_time_scaling/models/stage_enums.py +0 -43
aiq/experimental/inference_time_scaling/models/strategy_base.py +0 -66
aiq/experimental/inference_time_scaling/models/tool_use_config.py +0 -41
aiq/experimental/inference_time_scaling/register.py +0 -36
aiq/experimental/inference_time_scaling/scoring/__init__.py +0 -0
aiq/experimental/inference_time_scaling/scoring/llm_based_agent_scorer.py +0 -168
aiq/experimental/inference_time_scaling/scoring/llm_based_plan_scorer.py +0 -168
aiq/experimental/inference_time_scaling/scoring/motivation_aware_scorer.py +0 -111
aiq/experimental/inference_time_scaling/search/__init__.py +0 -0
aiq/experimental/inference_time_scaling/search/multi_llm_planner.py +0 -128
aiq/experimental/inference_time_scaling/search/multi_query_retrieval_search.py +0 -122
aiq/experimental/inference_time_scaling/search/single_shot_multi_plan_planner.py +0 -128
aiq/experimental/inference_time_scaling/selection/__init__.py +0 -0
aiq/experimental/inference_time_scaling/selection/best_of_n_selector.py +0 -63
aiq/experimental/inference_time_scaling/selection/llm_based_agent_output_selector.py +0 -131
aiq/experimental/inference_time_scaling/selection/llm_based_output_merging_selector.py +0 -159
aiq/experimental/inference_time_scaling/selection/llm_based_plan_selector.py +0 -128
aiq/experimental/inference_time_scaling/selection/threshold_selector.py +0 -58
aiq/front_ends/__init__.py +0 -14
aiq/front_ends/console/__init__.py +0 -14
aiq/front_ends/console/authentication_flow_handler.py +0 -233
aiq/front_ends/console/console_front_end_config.py +0 -32
aiq/front_ends/console/console_front_end_plugin.py +0 -96
aiq/front_ends/console/register.py +0 -25
aiq/front_ends/cron/__init__.py +0 -14
aiq/front_ends/fastapi/__init__.py +0 -14
aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +0 -27
aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +0 -107
aiq/front_ends/fastapi/fastapi_front_end_config.py +0 -234
aiq/front_ends/fastapi/fastapi_front_end_controller.py +0 -68
aiq/front_ends/fastapi/fastapi_front_end_plugin.py +0 -116
aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +0 -1092
aiq/front_ends/fastapi/html_snippets/__init__.py +0 -14
aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +0 -35
aiq/front_ends/fastapi/intermediate_steps_subscriber.py +0 -80
aiq/front_ends/fastapi/job_store.py +0 -183
aiq/front_ends/fastapi/main.py +0 -72
aiq/front_ends/fastapi/message_handler.py +0 -298
aiq/front_ends/fastapi/message_validator.py +0 -345
aiq/front_ends/fastapi/register.py +0 -25
aiq/front_ends/fastapi/response_helpers.py +0 -195
aiq/front_ends/fastapi/step_adaptor.py +0 -321
aiq/front_ends/mcp/__init__.py +0 -14
aiq/front_ends/mcp/mcp_front_end_config.py +0 -32
aiq/front_ends/mcp/mcp_front_end_plugin.py +0 -93
aiq/front_ends/mcp/register.py +0 -27
aiq/front_ends/mcp/tool_converter.py +0 -242
aiq/front_ends/register.py +0 -22
aiq/front_ends/simple_base/__init__.py +0 -14
aiq/front_ends/simple_base/simple_front_end_plugin_base.py +0 -54
aiq/llm/__init__.py +0 -0
aiq/llm/aws_bedrock_llm.py +0 -57
aiq/llm/nim_llm.py +0 -46
aiq/llm/openai_llm.py +0 -46
aiq/llm/register.py +0 -23
aiq/llm/utils/__init__.py +0 -14
aiq/llm/utils/env_config_value.py +0 -94
aiq/llm/utils/error.py +0 -17
aiq/memory/__init__.py +0 -20
aiq/memory/interfaces.py +0 -183
aiq/memory/models.py +0 -112
aiq/meta/module_to_distro.json +0 -3
aiq/meta/pypi.md +0 -58
aiq/object_store/__init__.py +0 -20
aiq/object_store/in_memory_object_store.py +0 -76
aiq/object_store/interfaces.py +0 -84
aiq/object_store/models.py +0 -36
aiq/object_store/register.py +0 -20
aiq/observability/__init__.py +0 -14
aiq/observability/exporter/__init__.py +0 -14
aiq/observability/exporter/base_exporter.py +0 -449
aiq/observability/exporter/exporter.py +0 -78
aiq/observability/exporter/file_exporter.py +0 -33
aiq/observability/exporter/processing_exporter.py +0 -322
aiq/observability/exporter/raw_exporter.py +0 -52
aiq/observability/exporter/span_exporter.py +0 -265
aiq/observability/exporter_manager.py +0 -335
aiq/observability/mixin/__init__.py +0 -14
aiq/observability/mixin/batch_config_mixin.py +0 -26
aiq/observability/mixin/collector_config_mixin.py +0 -23
aiq/observability/mixin/file_mixin.py +0 -288
aiq/observability/mixin/file_mode.py +0 -23
aiq/observability/mixin/resource_conflict_mixin.py +0 -134
aiq/observability/mixin/serialize_mixin.py +0 -61
aiq/observability/mixin/type_introspection_mixin.py +0 -183
aiq/observability/processor/__init__.py +0 -14
aiq/observability/processor/batching_processor.py +0 -309
aiq/observability/processor/callback_processor.py +0 -42
aiq/observability/processor/intermediate_step_serializer.py +0 -28
aiq/observability/processor/processor.py +0 -71
aiq/observability/register.py +0 -96
aiq/observability/utils/__init__.py +0 -14
aiq/observability/utils/dict_utils.py +0 -236
aiq/observability/utils/time_utils.py +0 -31
aiq/plugins/.namespace +0 -1
aiq/profiler/__init__.py +0 -0
aiq/profiler/calc/__init__.py +0 -14
aiq/profiler/calc/calc_runner.py +0 -627
aiq/profiler/calc/calculations.py +0 -288
aiq/profiler/calc/data_models.py +0 -188
aiq/profiler/calc/plot.py +0 -345
aiq/profiler/callbacks/__init__.py +0 -0
aiq/profiler/callbacks/agno_callback_handler.py +0 -295
aiq/profiler/callbacks/base_callback_class.py +0 -20
aiq/profiler/callbacks/langchain_callback_handler.py +0 -290
aiq/profiler/callbacks/llama_index_callback_handler.py +0 -205
aiq/profiler/callbacks/semantic_kernel_callback_handler.py +0 -238
aiq/profiler/callbacks/token_usage_base_model.py +0 -27
aiq/profiler/data_frame_row.py +0 -51
aiq/profiler/data_models.py +0 -24
aiq/profiler/decorators/__init__.py +0 -0
aiq/profiler/decorators/framework_wrapper.py +0 -131
aiq/profiler/decorators/function_tracking.py +0 -254
aiq/profiler/forecasting/__init__.py +0 -0
aiq/profiler/forecasting/config.py +0 -18
aiq/profiler/forecasting/model_trainer.py +0 -75
aiq/profiler/forecasting/models/__init__.py +0 -22
aiq/profiler/forecasting/models/forecasting_base_model.py +0 -40
aiq/profiler/forecasting/models/linear_model.py +0 -196
aiq/profiler/forecasting/models/random_forest_regressor.py +0 -268
aiq/profiler/inference_metrics_model.py +0 -28
aiq/profiler/inference_optimization/__init__.py +0 -0
aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +0 -460
aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +0 -258
aiq/profiler/inference_optimization/data_models.py +0 -386
aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +0 -468
aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +0 -405
aiq/profiler/inference_optimization/llm_metrics.py +0 -212
aiq/profiler/inference_optimization/prompt_caching.py +0 -163
aiq/profiler/inference_optimization/token_uniqueness.py +0 -107
aiq/profiler/inference_optimization/workflow_runtimes.py +0 -72
aiq/profiler/intermediate_property_adapter.py +0 -102
aiq/profiler/profile_runner.py +0 -473
aiq/profiler/utils.py +0 -184
aiq/registry_handlers/__init__.py +0 -0
aiq/registry_handlers/local/__init__.py +0 -0
aiq/registry_handlers/local/local_handler.py +0 -176
aiq/registry_handlers/local/register_local.py +0 -37
aiq/registry_handlers/metadata_factory.py +0 -60
aiq/registry_handlers/package_utils.py +0 -567
aiq/registry_handlers/pypi/__init__.py +0 -0
aiq/registry_handlers/pypi/pypi_handler.py +0 -251
aiq/registry_handlers/pypi/register_pypi.py +0 -40
aiq/registry_handlers/register.py +0 -21
aiq/registry_handlers/registry_handler_base.py +0 -157
aiq/registry_handlers/rest/__init__.py +0 -0
aiq/registry_handlers/rest/register_rest.py +0 -56
aiq/registry_handlers/rest/rest_handler.py +0 -237
aiq/registry_handlers/schemas/__init__.py +0 -0
aiq/registry_handlers/schemas/headers.py +0 -42
aiq/registry_handlers/schemas/package.py +0 -68
aiq/registry_handlers/schemas/publish.py +0 -63
aiq/registry_handlers/schemas/pull.py +0 -82
aiq/registry_handlers/schemas/remove.py +0 -36
aiq/registry_handlers/schemas/search.py +0 -91
aiq/registry_handlers/schemas/status.py +0 -47
aiq/retriever/__init__.py +0 -0
aiq/retriever/interface.py +0 -37
aiq/retriever/milvus/__init__.py +0 -14
aiq/retriever/milvus/register.py +0 -81
aiq/retriever/milvus/retriever.py +0 -228
aiq/retriever/models.py +0 -74
aiq/retriever/nemo_retriever/__init__.py +0 -14
aiq/retriever/nemo_retriever/register.py +0 -60
aiq/retriever/nemo_retriever/retriever.py +0 -190
aiq/retriever/register.py +0 -22
aiq/runtime/__init__.py +0 -14
aiq/runtime/loader.py +0 -215
aiq/runtime/runner.py +0 -190
aiq/runtime/session.py +0 -158
aiq/runtime/user_metadata.py +0 -130
aiq/settings/__init__.py +0 -0
aiq/settings/global_settings.py +0 -318
aiq/test/.namespace +0 -1
aiq/tool/__init__.py +0 -0
aiq/tool/chat_completion.py +0 -74
aiq/tool/code_execution/README.md +0 -151
aiq/tool/code_execution/__init__.py +0 -0
aiq/tool/code_execution/code_sandbox.py +0 -267
aiq/tool/code_execution/local_sandbox/.gitignore +0 -1
aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +0 -60
aiq/tool/code_execution/local_sandbox/__init__.py +0 -13
aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +0 -198
aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +0 -6
aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +0 -50
aiq/tool/code_execution/register.py +0 -74
aiq/tool/code_execution/test_code_execution_sandbox.py +0 -414
aiq/tool/code_execution/utils.py +0 -100
aiq/tool/datetime_tools.py +0 -42
aiq/tool/document_search.py +0 -141
aiq/tool/github_tools/__init__.py +0 -0
aiq/tool/github_tools/create_github_commit.py +0 -133
aiq/tool/github_tools/create_github_issue.py +0 -87
aiq/tool/github_tools/create_github_pr.py +0 -106
aiq/tool/github_tools/get_github_file.py +0 -106
aiq/tool/github_tools/get_github_issue.py +0 -166
aiq/tool/github_tools/get_github_pr.py +0 -256
aiq/tool/github_tools/update_github_issue.py +0 -100
aiq/tool/mcp/__init__.py +0 -14
aiq/tool/mcp/exceptions.py +0 -142
aiq/tool/mcp/mcp_client.py +0 -255
aiq/tool/mcp/mcp_tool.py +0 -96
aiq/tool/memory_tools/__init__.py +0 -0
aiq/tool/memory_tools/add_memory_tool.py +0 -79
aiq/tool/memory_tools/delete_memory_tool.py +0 -67
aiq/tool/memory_tools/get_memory_tool.py +0 -72
aiq/tool/nvidia_rag.py +0 -95
aiq/tool/register.py +0 -38
aiq/tool/retriever.py +0 -89
aiq/tool/server_tools.py +0 -66
aiq/utils/__init__.py +0 -0
aiq/utils/data_models/__init__.py +0 -0
aiq/utils/data_models/schema_validator.py +0 -58
aiq/utils/debugging_utils.py +0 -43
aiq/utils/dump_distro_mapping.py +0 -32
aiq/utils/exception_handlers/__init__.py +0 -0
aiq/utils/exception_handlers/automatic_retries.py +0 -289
aiq/utils/exception_handlers/mcp.py +0 -211
aiq/utils/exception_handlers/schemas.py +0 -114
aiq/utils/io/__init__.py +0 -0
aiq/utils/io/model_processing.py +0 -28
aiq/utils/io/yaml_tools.py +0 -119
aiq/utils/log_utils.py +0 -37
aiq/utils/metadata_utils.py +0 -74
aiq/utils/optional_imports.py +0 -142
aiq/utils/producer_consumer_queue.py +0 -178
aiq/utils/reactive/__init__.py +0 -0
aiq/utils/reactive/base/__init__.py +0 -0
aiq/utils/reactive/base/observable_base.py +0 -65
aiq/utils/reactive/base/observer_base.py +0 -55
aiq/utils/reactive/base/subject_base.py +0 -79
aiq/utils/reactive/observable.py +0 -59
aiq/utils/reactive/observer.py +0 -76
aiq/utils/reactive/subject.py +0 -131
aiq/utils/reactive/subscription.py +0 -49
aiq/utils/settings/__init__.py +0 -0
aiq/utils/settings/global_settings.py +0 -197
aiq/utils/string_utils.py +0 -38
aiq/utils/type_converter.py +0 -290
aiq/utils/type_utils.py +0 -484
aiq/utils/url_utils.py +0 -27
aiqtoolkit-1.2.0rc4.dist-info/METADATA +0 -363
aiqtoolkit-1.2.0rc4.dist-info/RECORD +0 -438
aiqtoolkit-1.2.0rc4.dist-info/entry_points.txt +0 -20
aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE-3rd-party.txt +0 -3686
aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE.md +0 -201
aiqtoolkit-1.2.0rc4.dist-info/top_level.txt +0 -1
{aiqtoolkit-1.2.0rc4.dist-info → aiqtoolkit-1.2rc9.dist-info}/WHEEL +0 -0

aiq/profiler/calc/calculations.py DELETED Viewed

@@ -1,288 +0,0 @@
-# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
-# SPDX-License-Identifier: Apache-2.0
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-import logging
-import numpy as np
-from aiq.profiler.calc.data_models import FitConfig
-from aiq.profiler.calc.data_models import GPUEstimates
-from aiq.profiler.calc.data_models import LinearFitResult
-logger = logging.getLogger(__name__)
-def compute_slope(concurrencies: list[float],
-                  time_metrics: list[float],
-                  fit_config: FitConfig | None = None) -> LinearFitResult:
-    """
-    Concurrency is the independent variable (x-axis) and time metric (which can be runtime or latency)
-    is the dependent variable (y-axis). This function computes the slope of the linear relationship
-    between concurrency and time metric.
-    Args:
-        concurrencies: List of concurrency values (x-axis)
-        time_metrics: List of time metric values (y-axis)
-        fit_config: Configuration for outlier detection and fit validation
-    Returns:
-        LinearFitResult containing slope, intercept, R-squared, and outliers removed
-    Raises:
-        ValueError: If the relationship is not linear (R² < min_r_squared)
-    """
-    # Use default config if none provided
-    if fit_config is None:
-        fit_config = FitConfig()
-    # Convert to numpy arrays for calculations
-    x = np.array(concurrencies)
-    y = np.array(time_metrics)
-    # Validate input
-    if len(x) != len(y):
-        raise ValueError("Concurrencies and time_metrics must have the same length")
-    if len(x) < 2:
-        raise ValueError("Need at least 2 points for linear regression")
-    outliers_removed = []
-    # Remove outliers if requested
-    if fit_config.remove_outliers and len(x) > 4:  # Need at least 4 points for outlier detection
-        x_clean, y_clean, removed_concurrencies = _remove_outliers(x, y, fit_config)
-        x, y = x_clean, y_clean
-        outliers_removed = removed_concurrencies
-    # Calculate linear regression using least squares
-    n = len(x)
-    sum_x = x.sum()
-    sum_y = y.sum()
-    sum_xy = (x * y).sum()
-    sum_x2 = (x**2).sum()
-    # Calculate slope and intercept
-    slope = (n * sum_xy - sum_x * sum_y) / (n * sum_x2 - sum_x**2)
-    intercept = (sum_y - slope * sum_x) / n
-    # Calculate R-squared
-    y_pred = slope * x + intercept
-    ss_res = ((y - y_pred)**2).sum()
-    ss_tot = ((y - y.mean())**2).sum()
-    r_squared = 1 - (ss_res / ss_tot) if ss_tot != 0 else 0.0
-    # Validate linearity
-    if r_squared < fit_config.min_r_squared:
-        raise ValueError(f"Poor linear fit detected (R² = {r_squared:.3f} < {fit_config.min_r_squared}). "
-                         f"The relationship may not be linear. Consider using non-linear regression.")
-    return LinearFitResult(slope=slope, intercept=intercept, r_squared=r_squared, outliers_removed=outliers_removed)
-def _remove_outliers(x: np.ndarray, y: np.ndarray, fit_config: FitConfig) -> tuple[np.ndarray, np.ndarray, list[int]]:
-    """
-    Remove outliers using the Interquartile Range (IQR) method.
-    For small concurrency range (≤ threshold points), also checks raw y-values for extreme outliers.
-    Args:
-        x: Input x values (concurrencies)
-        y: Input y values (time metrics)
-        fit_config: Configuration for outlier detection
-    Returns:
-        Tuple of (cleaned_x, cleaned_y, list_of_removed_concurrencies)
-    """
-    # if the number of concurrency points is less removing outliers can be challenging
-    # as extreme outliers can skew the results.
-    # We use a threshold to check for extreme outliers in raw y-values first.
-    n = len(x)
-    all_removed_concurrencies = []
-    # For smaller concurrency ranges, check for extreme outliers in raw y-values first
-    if n <= fit_config.small_concurrency_range_threshold:
-        # Calculate IQR on raw y-values
-        y_q1 = np.percentile(y, 25)
-        y_q3 = np.percentile(y, 75)
-        y_iqr = y_q3 - y_q1
-        # Use a more aggressive threshold for small datasets
-        y_lower_bound = y_q1 - fit_config.extreme_outlier_threshold * y_iqr  # More aggressive than 1.5
-        y_upper_bound = y_q3 + fit_config.extreme_outlier_threshold * y_iqr
-        # Find extreme outliers in raw values
-        extreme_outlier_mask = (y >= y_lower_bound) & (y <= y_upper_bound)
-        extreme_outliers_removed = np.sum(~extreme_outlier_mask)
-        if extreme_outliers_removed > 0:
-            extreme_removed_concurrencies = x[~extreme_outlier_mask].tolist()
-            all_removed_concurrencies.extend(extreme_removed_concurrencies)
-            logger.info("Removed %d extreme outliers from raw values: concurrencies %s",
-                        extreme_outliers_removed,
-                        extreme_removed_concurrencies)
-            # Continue with residual-based detection on the cleaned data
-            x = x[extreme_outlier_mask]
-            y = y[extreme_outlier_mask]
-            n = len(x)
-    # Standard residual-based outlier detection
-    # Calculate residuals from a simple linear fit
-    if n == 0:
-        raise ValueError("No data points remaining after outlier removal. Cannot compute linear fit.")
-    sum_x = x.sum()
-    sum_y = y.sum()
-    sum_xy = (x * y).sum()
-    sum_x2 = (x**2).sum()
-    slope = (n * sum_xy - sum_x * sum_y) / (n * sum_x2 - sum_x**2)
-    intercept = (sum_y - slope * sum_x) / n
-    # Calculate residuals
-    y_pred = slope * x + intercept
-    residuals = y - y_pred
-    # Use IQR method to detect outliers
-    q1 = np.percentile(residuals, 25)
-    q3 = np.percentile(residuals, 75)
-    iqr = q3 - q1
-    # Define outlier bounds (1.5 * IQR rule)
-    lower_bound = q1 - fit_config.conservative_outlier_threshold * iqr
-    upper_bound = q3 + fit_config.conservative_outlier_threshold * iqr
-    # Find non-outlier indices
-    non_outlier_mask = (residuals >= lower_bound) & (residuals <= upper_bound)
-    outliers_removed = np.sum(~non_outlier_mask)
-    residual_removed_concurrencies = x[~non_outlier_mask].tolist()
-    all_removed_concurrencies.extend(residual_removed_concurrencies)
-    # Add debugging for small datasets
-    if len(x) <= fit_config.small_concurrency_range_threshold:
-        logger.debug("Outlier detection for small dataset (n=%d):", len(x))
-        logger.debug("  Data points: %s", list(zip(x, y)))
-        logger.debug("  Residuals: %s", residuals.tolist())
-        logger.debug("  Q1=%.3f, Q3=%.3f, IQR=%.3f", q1, q3, iqr)
-        logger.debug("  Bounds: [%.3f, %.3f]", lower_bound, upper_bound)
-        logger.info("  Outliers removed: %d (concurrencies: %s)", outliers_removed, residual_removed_concurrencies)
-    return x[non_outlier_mask], y[non_outlier_mask], all_removed_concurrencies
-def calc_gpu_estimate_based_on_slope(target_time_metric: float,
-                                     target_users: int,
-                                     test_gpu_count: int,
-                                     observed_slope: float,
-                                     observed_intercept: float = 0.0) -> float:
-    """
-    Calculate the GPU estimate based on the slope of the time metric.
-    This function uses the linear relationship between concurrency and time metrics
-    to estimate the required GPU count for a target user load.
-    Args:
-        target_time_metric: Target time metric (latency or runtime) in seconds
-        observed_slope: Slope from linear regression of time vs concurrency
-        target_users: Target number of concurrent users
-        test_gpu_count: Number of GPUs used in the test
-        observed_intercept: Y-intercept from linear regression (default: 0.0)
-    Returns:
-        Estimated number of GPUs required
-    Raises:
-        ValueError: If target_time_metric is less than or equal to intercept
-    """
-    if target_time_metric <= observed_intercept:
-        raise ValueError(f"Target time metric ({target_time_metric}) must be greater than "
-                         f"the intercept ({observed_intercept}) for valid GPU estimation.")
-    # Calculate the concurrency that would achieve the target time metric
-    # Using the linear equation: time = slope * concurrency + intercept
-    # Solving for concurrency: concurrency = (time - intercept) / slope
-    calculated_concurrency = (target_time_metric - observed_intercept) / observed_slope
-    logger.info("Calculated concurrency: %f for target time metric: %f, observed intercept: %f, observed slope: %f",
-                calculated_concurrency,
-                target_time_metric,
-                observed_intercept,
-                observed_slope)
-    if calculated_concurrency <= 0:
-        raise ValueError(f"Calculated target concurrency ({calculated_concurrency}) is not positive. "
-                         f"This suggests the slope or intercept values may be invalid.")
-    # Estimate GPUs using the ratio of target users to target concurrency
-    # scaled by the test GPU count
-    gpu_estimate = (target_users / calculated_concurrency) * test_gpu_count
-    return gpu_estimate
-def calc_gpu_estimate_for_single_concurrency(target_llm_latency: float,
-                                             target_workflow_runtime: float,
-                                             target_users: int,
-                                             test_concurrency: int,
-                                             test_gpu_count: int,
-                                             observed_latency: float,
-                                             observed_runtime: float) -> GPUEstimates:
-    """
-    ROUGH ESTIMATE: Calculate GPU count estimate for a single concurrency level.
-    This is a simplified estimate that assumes linear scaling and should be used
-    as a baseline only. For more accurate estimates, use slope-based estimation
-    with multiple concurrency levels.
-    Formula based on the target latency:
-        G_required = (U_target / C_test) * (L_obs / L_target) * G_test
-    Formula based on the target runtime:
-        G_required = (U_target / C_test) * (R_obs / R_target) * G_test
-    where:
-        - U_target: Target number of users
-        - C_test: Test concurrency level
-        - L_obs: Observed LLM latency
-        - L_target: Target LLM latency
-        - R_obs: Observed workflow runtime
-        - R_target: Target workflow runtime
-        - G_test: Test GPU count
-    WARNING: This is a rough estimate that:
-    - Assumes perfect linear scaling (rarely true in practice)
-    - Doesn't account for GPU utilization inefficiencies
-    - May underestimate GPU requirements for high concurrency
-    - Should be validated against slope-based estimates
-    """
-    use_latency = target_llm_latency > 0
-    use_runtime = target_workflow_runtime > 0
-    # If observed latency or runtime exceeds the target, return empty estimates
-    if use_latency and observed_latency > target_llm_latency:
-        return GPUEstimates()
-    if use_runtime and observed_runtime > target_workflow_runtime:
-        return GPUEstimates()
-    # Calculate multipliers (how much faster we need to be)
-    llm_latency_multiplier = observed_latency / target_llm_latency if use_latency else 1.0
-    wf_runtime_multiplier = observed_runtime / target_workflow_runtime if use_runtime else 1.0
-    # Calculate GPU estimates using the corrected formula
-    gpu_estimate_by_wf_runtime = (target_users /
-                                  test_concurrency) * wf_runtime_multiplier * test_gpu_count if use_runtime else None
-    gpu_estimate_by_llm_latency = (target_users /
-                                   test_concurrency) * llm_latency_multiplier * test_gpu_count if use_latency else None
-    return GPUEstimates(gpu_estimate_by_wf_runtime=gpu_estimate_by_wf_runtime,
-                        gpu_estimate_by_llm_latency=gpu_estimate_by_llm_latency)

aiq/profiler/calc/data_models.py DELETED Viewed

@@ -1,188 +0,0 @@
-# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
-# SPDX-License-Identifier: Apache-2.0
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-import typing
-from pathlib import Path
-from pydantic import BaseModel
-from pydantic import Field
-class FitConfig(BaseModel):
-    """
-    Configuration parameters for linear fit and outlier detection.
-    """
-    # Threshold for small concurrency range (≤ 8 points) to check for extreme outliers in raw y-values first
-    small_concurrency_range_threshold: int = 8
-    # Extreme outlier threshold is 2.0 times the IQR, extreme outliers are removed
-    extreme_outlier_threshold: float = 2.0
-    # Conservative outlier threshold is 1.5 times the IQR, conservative outliers are removed
-    conservative_outlier_threshold: float = 1.5
-    # Minimum R-squared value required for a valid linear fit
-    min_r_squared: float = 0.7
-    # Whether to remove outliers during linear fit calculation
-    remove_outliers: bool = True
-class CalcRunnerConfig(BaseModel):
-    """
-    Parameters used for a calc runner.
-    """
-    # base config and endpoints (if remote) - not needed in offline mode
-    config_file: Path | None = None
-    # endpoint to use for the workflow, if not provided the workflow is run locally
-    endpoint: str | None = None
-    # timeout for the workflow
-    endpoint_timeout: int = 300
-    # if true, the workflow is not run; instead, results from previous runs are used to estimate
-    # the GPU count
-    offline_mode: bool = False
-    # number of passes at each concurrency; if 0, the dataset is adjusted to a multiple of the
-    # concurrency
-    num_passes: int = 0
-    # concurrency values to test
-    concurrencies: list[int] = [1, 2, 4, 8]
-    # Targets for GPU estimation
-    target_llm_latency_p95: float = 0
-    target_workflow_runtime_p95: float = 0
-    target_users: int = 0
-    # Test setup information needed for GPU estimation
-    test_gpu_count: int = 0
-    # output directory for results
-    output_dir: Path | None = None
-    # if true, the job is stored in a new subdirectory of the output directory
-    append_job: bool = False
-    # if true, the data is plotted
-    plot_data: bool = True
-    # Configuration for linear fit and outlier detection
-    fit_config: FitConfig = Field(default_factory=FitConfig)
-# Sizing metrics are gathered from the evaluation runs and used as input by the calculator.
-class SizingMetricPerItem(BaseModel):
-    """
-    Sizing metrics per dataset entry item.
-    """
-    # LLM latency
-    llm_latency: float
-    # workflow runtime
-    workflow_runtime: float
-class SizingMetricsAlerts(BaseModel):
-    """
-    Sizing metrics alerts.
-    """
-    # if true, the workflow was interrupted, so that concurrency cannot be used
-    workflow_interrupted: bool = False
-class SizingMetrics(BaseModel):
-    """
-    Sizing metrics for a single concurrency.
-    """
-    # alerts associated with the sizing metrics
-    alerts: SizingMetricsAlerts = Field(default_factory=SizingMetricsAlerts)
-    # p95 LLM latency
-    llm_latency_p95: float = 0.0
-    # p95 workflow runtime
-    workflow_runtime_p95: float = 0.0
-    # total workflow runtime
-    total_runtime: float = 0.0
-    # per item metrics, key is the dataset entry id
-    per_item_metrics: dict[typing.Any, SizingMetricPerItem] = {}
-class LinearFitResult(BaseModel):
-    """
-    Result of linear regression including slope, intercept, and quality metrics.
-    """
-    slope: float
-    intercept: float
-    r_squared: float
-    outliers_removed: list[int]
-class FitResults(BaseModel):
-    """
-    Linear fit results for both LLM latency and workflow runtime analysis.
-    """
-    llm_latency_fit: LinearFitResult | None = None
-    wf_runtime_fit: LinearFitResult | None = None
-# GPU estimates are generated by the calculator.
-class GPUEstimates(BaseModel):
-    """
-    GPU estimates.
-    """
-    # GPU estimate based on the workflow runtime
-    gpu_estimate_by_wf_runtime: float | None = None
-    # GPU estimate based on the LLM latency
-    gpu_estimate_by_llm_latency: float | None = None
-# Calc runner alerts are generated by the calculator.
-class CalcAlerts(BaseModel):
-    """
-    Calc runner alerts.
-    """
-    # if true, the run was identified as an outlier by the workflow runtime linear fit
-    outlier_workflow_runtime: bool = False
-    # if true, the run was identified as an outlier by the LLM latency linear fit
-    outlier_llm_latency: bool = False
-    # number of items that are greater than the target latency
-    num_items_greater_than_target_latency: int = 0
-    # number of items that are greater than the target runtime
-    num_items_greater_than_target_runtime: int = 0
-class CalcData(BaseModel):
-    """
-    Output of the calc runner per concurrency.
-    """
-    # ROUGH GPU estimates per concurrency: these are not used for the final GPU estimation;
-    # they are only available for informational purposes
-    gpu_estimates: GPUEstimates = Field(default_factory=GPUEstimates)
-    # Calc runner alerts
-    alerts: CalcAlerts = Field(default_factory=CalcAlerts)
-    # Sizing metrics
-    sizing_metrics: SizingMetrics = Field(default_factory=SizingMetrics)
-class CalcRunnerOutput(BaseModel):
-    """
-    Output of the calc runner.
-    """
-    # GPU estimates based on the slope of the time vs concurrency, calculated online or offline
-    gpu_estimates: GPUEstimates = Field(default_factory=GPUEstimates)
-    # Linear fit results for analysis and debugging
-    fit_results: FitResults = Field(default_factory=FitResults)
-    # Per-concurrency data (GPU estimates, out-of-range runs, and sizing metrics)
-    calc_data: dict[int, CalcData] = {}

aiqtoolkit 1.2.0rc4__py3-none-any.whl → 1.2rc9__py3-none-any.whl

Potentially problematic release.

aiqtoolkit 1.2.0rc4__py3-none-any.whl → 1.2rc9__py3-none-any.whl