aiqtoolkit-1.2.0rc4-py3-none-any.whl → aiqtoolkit-1.2.0rc5-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of aiqtoolkit might be problematic.
Files changed (441)
  1. aiqtoolkit-1.2.0rc5.dist-info/METADATA +29 -0
  2. aiqtoolkit-1.2.0rc5.dist-info/RECORD +4 -0
  3. aiqtoolkit-1.2.0rc5.dist-info/top_level.txt +1 -0
  4. aiq/agent/__init__.py +0 -0
  5. aiq/agent/base.py +0 -239
  6. aiq/agent/dual_node.py +0 -67
  7. aiq/agent/react_agent/__init__.py +0 -0
  8. aiq/agent/react_agent/agent.py +0 -355
  9. aiq/agent/react_agent/output_parser.py +0 -104
  10. aiq/agent/react_agent/prompt.py +0 -41
  11. aiq/agent/react_agent/register.py +0 -149
  12. aiq/agent/reasoning_agent/__init__.py +0 -0
  13. aiq/agent/reasoning_agent/reasoning_agent.py +0 -225
  14. aiq/agent/register.py +0 -23
  15. aiq/agent/rewoo_agent/__init__.py +0 -0
  16. aiq/agent/rewoo_agent/agent.py +0 -411
  17. aiq/agent/rewoo_agent/prompt.py +0 -108
  18. aiq/agent/rewoo_agent/register.py +0 -158
  19. aiq/agent/tool_calling_agent/__init__.py +0 -0
  20. aiq/agent/tool_calling_agent/agent.py +0 -119
  21. aiq/agent/tool_calling_agent/register.py +0 -106
  22. aiq/authentication/__init__.py +0 -14
  23. aiq/authentication/api_key/__init__.py +0 -14
  24. aiq/authentication/api_key/api_key_auth_provider.py +0 -96
  25. aiq/authentication/api_key/api_key_auth_provider_config.py +0 -124
  26. aiq/authentication/api_key/register.py +0 -26
  27. aiq/authentication/exceptions/__init__.py +0 -14
  28. aiq/authentication/exceptions/api_key_exceptions.py +0 -38
  29. aiq/authentication/exceptions/auth_code_grant_exceptions.py +0 -86
  30. aiq/authentication/exceptions/call_back_exceptions.py +0 -38
  31. aiq/authentication/exceptions/request_exceptions.py +0 -54
  32. aiq/authentication/http_basic_auth/__init__.py +0 -0
  33. aiq/authentication/http_basic_auth/http_basic_auth_provider.py +0 -81
  34. aiq/authentication/http_basic_auth/register.py +0 -30
  35. aiq/authentication/interfaces.py +0 -93
  36. aiq/authentication/oauth2/__init__.py +0 -14
  37. aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +0 -107
  38. aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +0 -39
  39. aiq/authentication/oauth2/register.py +0 -25
  40. aiq/authentication/register.py +0 -21
  41. aiq/builder/__init__.py +0 -0
  42. aiq/builder/builder.py +0 -285
  43. aiq/builder/component_utils.py +0 -316
  44. aiq/builder/context.py +0 -264
  45. aiq/builder/embedder.py +0 -24
  46. aiq/builder/eval_builder.py +0 -161
  47. aiq/builder/evaluator.py +0 -29
  48. aiq/builder/framework_enum.py +0 -24
  49. aiq/builder/front_end.py +0 -73
  50. aiq/builder/function.py +0 -344
  51. aiq/builder/function_base.py +0 -380
  52. aiq/builder/function_info.py +0 -627
  53. aiq/builder/intermediate_step_manager.py +0 -174
  54. aiq/builder/llm.py +0 -25
  55. aiq/builder/retriever.py +0 -25
  56. aiq/builder/user_interaction_manager.py +0 -74
  57. aiq/builder/workflow.py +0 -148
  58. aiq/builder/workflow_builder.py +0 -1117
  59. aiq/cli/__init__.py +0 -14
  60. aiq/cli/cli_utils/__init__.py +0 -0
  61. aiq/cli/cli_utils/config_override.py +0 -231
  62. aiq/cli/cli_utils/validation.py +0 -37
  63. aiq/cli/commands/__init__.py +0 -0
  64. aiq/cli/commands/configure/__init__.py +0 -0
  65. aiq/cli/commands/configure/channel/__init__.py +0 -0
  66. aiq/cli/commands/configure/channel/add.py +0 -28
  67. aiq/cli/commands/configure/channel/channel.py +0 -36
  68. aiq/cli/commands/configure/channel/remove.py +0 -30
  69. aiq/cli/commands/configure/channel/update.py +0 -30
  70. aiq/cli/commands/configure/configure.py +0 -33
  71. aiq/cli/commands/evaluate.py +0 -139
  72. aiq/cli/commands/info/__init__.py +0 -14
  73. aiq/cli/commands/info/info.py +0 -39
  74. aiq/cli/commands/info/list_channels.py +0 -32
  75. aiq/cli/commands/info/list_components.py +0 -129
  76. aiq/cli/commands/info/list_mcp.py +0 -213
  77. aiq/cli/commands/registry/__init__.py +0 -14
  78. aiq/cli/commands/registry/publish.py +0 -88
  79. aiq/cli/commands/registry/pull.py +0 -118
  80. aiq/cli/commands/registry/registry.py +0 -38
  81. aiq/cli/commands/registry/remove.py +0 -108
  82. aiq/cli/commands/registry/search.py +0 -155
  83. aiq/cli/commands/sizing/__init__.py +0 -14
  84. aiq/cli/commands/sizing/calc.py +0 -297
  85. aiq/cli/commands/sizing/sizing.py +0 -27
  86. aiq/cli/commands/start.py +0 -246
  87. aiq/cli/commands/uninstall.py +0 -81
  88. aiq/cli/commands/validate.py +0 -47
  89. aiq/cli/commands/workflow/__init__.py +0 -14
  90. aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
  91. aiq/cli/commands/workflow/templates/config.yml.j2 +0 -16
  92. aiq/cli/commands/workflow/templates/pyproject.toml.j2 +0 -22
  93. aiq/cli/commands/workflow/templates/register.py.j2 +0 -5
  94. aiq/cli/commands/workflow/templates/workflow.py.j2 +0 -36
  95. aiq/cli/commands/workflow/workflow.py +0 -37
  96. aiq/cli/commands/workflow/workflow_commands.py +0 -313
  97. aiq/cli/entrypoint.py +0 -135
  98. aiq/cli/main.py +0 -44
  99. aiq/cli/register_workflow.py +0 -488
  100. aiq/cli/type_registry.py +0 -1000
  101. aiq/data_models/__init__.py +0 -14
  102. aiq/data_models/api_server.py +0 -694
  103. aiq/data_models/authentication.py +0 -231
  104. aiq/data_models/common.py +0 -171
  105. aiq/data_models/component.py +0 -54
  106. aiq/data_models/component_ref.py +0 -168
  107. aiq/data_models/config.py +0 -406
  108. aiq/data_models/dataset_handler.py +0 -123
  109. aiq/data_models/discovery_metadata.py +0 -335
  110. aiq/data_models/embedder.py +0 -27
  111. aiq/data_models/evaluate.py +0 -127
  112. aiq/data_models/evaluator.py +0 -26
  113. aiq/data_models/front_end.py +0 -26
  114. aiq/data_models/function.py +0 -30
  115. aiq/data_models/function_dependencies.py +0 -72
  116. aiq/data_models/interactive.py +0 -246
  117. aiq/data_models/intermediate_step.py +0 -302
  118. aiq/data_models/invocation_node.py +0 -38
  119. aiq/data_models/its_strategy.py +0 -30
  120. aiq/data_models/llm.py +0 -27
  121. aiq/data_models/logging.py +0 -26
  122. aiq/data_models/memory.py +0 -27
  123. aiq/data_models/object_store.py +0 -44
  124. aiq/data_models/profiler.py +0 -54
  125. aiq/data_models/registry_handler.py +0 -26
  126. aiq/data_models/retriever.py +0 -30
  127. aiq/data_models/retry_mixin.py +0 -35
  128. aiq/data_models/span.py +0 -187
  129. aiq/data_models/step_adaptor.py +0 -64
  130. aiq/data_models/streaming.py +0 -33
  131. aiq/data_models/swe_bench_model.py +0 -54
  132. aiq/data_models/telemetry_exporter.py +0 -26
  133. aiq/embedder/__init__.py +0 -0
  134. aiq/embedder/langchain_client.py +0 -41
  135. aiq/embedder/nim_embedder.py +0 -59
  136. aiq/embedder/openai_embedder.py +0 -43
  137. aiq/embedder/register.py +0 -24
  138. aiq/eval/__init__.py +0 -14
  139. aiq/eval/config.py +0 -60
  140. aiq/eval/dataset_handler/__init__.py +0 -0
  141. aiq/eval/dataset_handler/dataset_downloader.py +0 -106
  142. aiq/eval/dataset_handler/dataset_filter.py +0 -52
  143. aiq/eval/dataset_handler/dataset_handler.py +0 -254
  144. aiq/eval/evaluate.py +0 -506
  145. aiq/eval/evaluator/__init__.py +0 -14
  146. aiq/eval/evaluator/base_evaluator.py +0 -73
  147. aiq/eval/evaluator/evaluator_model.py +0 -45
  148. aiq/eval/intermediate_step_adapter.py +0 -99
  149. aiq/eval/rag_evaluator/__init__.py +0 -0
  150. aiq/eval/rag_evaluator/evaluate.py +0 -178
  151. aiq/eval/rag_evaluator/register.py +0 -143
  152. aiq/eval/register.py +0 -23
  153. aiq/eval/remote_workflow.py +0 -133
  154. aiq/eval/runners/__init__.py +0 -14
  155. aiq/eval/runners/config.py +0 -39
  156. aiq/eval/runners/multi_eval_runner.py +0 -54
  157. aiq/eval/runtime_event_subscriber.py +0 -52
  158. aiq/eval/swe_bench_evaluator/__init__.py +0 -0
  159. aiq/eval/swe_bench_evaluator/evaluate.py +0 -215
  160. aiq/eval/swe_bench_evaluator/register.py +0 -36
  161. aiq/eval/trajectory_evaluator/__init__.py +0 -0
  162. aiq/eval/trajectory_evaluator/evaluate.py +0 -75
  163. aiq/eval/trajectory_evaluator/register.py +0 -40
  164. aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
  165. aiq/eval/tunable_rag_evaluator/evaluate.py +0 -245
  166. aiq/eval/tunable_rag_evaluator/register.py +0 -52
  167. aiq/eval/usage_stats.py +0 -41
  168. aiq/eval/utils/__init__.py +0 -0
  169. aiq/eval/utils/output_uploader.py +0 -140
  170. aiq/eval/utils/tqdm_position_registry.py +0 -40
  171. aiq/eval/utils/weave_eval.py +0 -184
  172. aiq/experimental/__init__.py +0 -0
  173. aiq/experimental/decorators/__init__.py +0 -0
  174. aiq/experimental/decorators/experimental_warning_decorator.py +0 -130
  175. aiq/experimental/inference_time_scaling/__init__.py +0 -0
  176. aiq/experimental/inference_time_scaling/editing/__init__.py +0 -0
  177. aiq/experimental/inference_time_scaling/editing/iterative_plan_refinement_editor.py +0 -147
  178. aiq/experimental/inference_time_scaling/editing/llm_as_a_judge_editor.py +0 -204
  179. aiq/experimental/inference_time_scaling/editing/motivation_aware_summarization.py +0 -107
  180. aiq/experimental/inference_time_scaling/functions/__init__.py +0 -0
  181. aiq/experimental/inference_time_scaling/functions/execute_score_select_function.py +0 -105
  182. aiq/experimental/inference_time_scaling/functions/its_tool_orchestration_function.py +0 -205
  183. aiq/experimental/inference_time_scaling/functions/its_tool_wrapper_function.py +0 -146
  184. aiq/experimental/inference_time_scaling/functions/plan_select_execute_function.py +0 -224
  185. aiq/experimental/inference_time_scaling/models/__init__.py +0 -0
  186. aiq/experimental/inference_time_scaling/models/editor_config.py +0 -132
  187. aiq/experimental/inference_time_scaling/models/its_item.py +0 -48
  188. aiq/experimental/inference_time_scaling/models/scoring_config.py +0 -112
  189. aiq/experimental/inference_time_scaling/models/search_config.py +0 -120
  190. aiq/experimental/inference_time_scaling/models/selection_config.py +0 -154
  191. aiq/experimental/inference_time_scaling/models/stage_enums.py +0 -43
  192. aiq/experimental/inference_time_scaling/models/strategy_base.py +0 -66
  193. aiq/experimental/inference_time_scaling/models/tool_use_config.py +0 -41
  194. aiq/experimental/inference_time_scaling/register.py +0 -36
  195. aiq/experimental/inference_time_scaling/scoring/__init__.py +0 -0
  196. aiq/experimental/inference_time_scaling/scoring/llm_based_agent_scorer.py +0 -168
  197. aiq/experimental/inference_time_scaling/scoring/llm_based_plan_scorer.py +0 -168
  198. aiq/experimental/inference_time_scaling/scoring/motivation_aware_scorer.py +0 -111
  199. aiq/experimental/inference_time_scaling/search/__init__.py +0 -0
  200. aiq/experimental/inference_time_scaling/search/multi_llm_planner.py +0 -128
  201. aiq/experimental/inference_time_scaling/search/multi_query_retrieval_search.py +0 -122
  202. aiq/experimental/inference_time_scaling/search/single_shot_multi_plan_planner.py +0 -128
  203. aiq/experimental/inference_time_scaling/selection/__init__.py +0 -0
  204. aiq/experimental/inference_time_scaling/selection/best_of_n_selector.py +0 -63
  205. aiq/experimental/inference_time_scaling/selection/llm_based_agent_output_selector.py +0 -131
  206. aiq/experimental/inference_time_scaling/selection/llm_based_output_merging_selector.py +0 -159
  207. aiq/experimental/inference_time_scaling/selection/llm_based_plan_selector.py +0 -128
  208. aiq/experimental/inference_time_scaling/selection/threshold_selector.py +0 -58
  209. aiq/front_ends/__init__.py +0 -14
  210. aiq/front_ends/console/__init__.py +0 -14
  211. aiq/front_ends/console/authentication_flow_handler.py +0 -233
  212. aiq/front_ends/console/console_front_end_config.py +0 -32
  213. aiq/front_ends/console/console_front_end_plugin.py +0 -96
  214. aiq/front_ends/console/register.py +0 -25
  215. aiq/front_ends/cron/__init__.py +0 -14
  216. aiq/front_ends/fastapi/__init__.py +0 -14
  217. aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
  218. aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +0 -27
  219. aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +0 -107
  220. aiq/front_ends/fastapi/fastapi_front_end_config.py +0 -234
  221. aiq/front_ends/fastapi/fastapi_front_end_controller.py +0 -68
  222. aiq/front_ends/fastapi/fastapi_front_end_plugin.py +0 -116
  223. aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +0 -1092
  224. aiq/front_ends/fastapi/html_snippets/__init__.py +0 -14
  225. aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +0 -35
  226. aiq/front_ends/fastapi/intermediate_steps_subscriber.py +0 -80
  227. aiq/front_ends/fastapi/job_store.py +0 -183
  228. aiq/front_ends/fastapi/main.py +0 -72
  229. aiq/front_ends/fastapi/message_handler.py +0 -298
  230. aiq/front_ends/fastapi/message_validator.py +0 -345
  231. aiq/front_ends/fastapi/register.py +0 -25
  232. aiq/front_ends/fastapi/response_helpers.py +0 -195
  233. aiq/front_ends/fastapi/step_adaptor.py +0 -321
  234. aiq/front_ends/mcp/__init__.py +0 -14
  235. aiq/front_ends/mcp/mcp_front_end_config.py +0 -32
  236. aiq/front_ends/mcp/mcp_front_end_plugin.py +0 -93
  237. aiq/front_ends/mcp/register.py +0 -27
  238. aiq/front_ends/mcp/tool_converter.py +0 -242
  239. aiq/front_ends/register.py +0 -22
  240. aiq/front_ends/simple_base/__init__.py +0 -14
  241. aiq/front_ends/simple_base/simple_front_end_plugin_base.py +0 -54
  242. aiq/llm/__init__.py +0 -0
  243. aiq/llm/aws_bedrock_llm.py +0 -57
  244. aiq/llm/nim_llm.py +0 -46
  245. aiq/llm/openai_llm.py +0 -46
  246. aiq/llm/register.py +0 -23
  247. aiq/llm/utils/__init__.py +0 -14
  248. aiq/llm/utils/env_config_value.py +0 -94
  249. aiq/llm/utils/error.py +0 -17
  250. aiq/memory/__init__.py +0 -20
  251. aiq/memory/interfaces.py +0 -183
  252. aiq/memory/models.py +0 -112
  253. aiq/meta/module_to_distro.json +0 -3
  254. aiq/meta/pypi.md +0 -58
  255. aiq/object_store/__init__.py +0 -20
  256. aiq/object_store/in_memory_object_store.py +0 -76
  257. aiq/object_store/interfaces.py +0 -84
  258. aiq/object_store/models.py +0 -36
  259. aiq/object_store/register.py +0 -20
  260. aiq/observability/__init__.py +0 -14
  261. aiq/observability/exporter/__init__.py +0 -14
  262. aiq/observability/exporter/base_exporter.py +0 -449
  263. aiq/observability/exporter/exporter.py +0 -78
  264. aiq/observability/exporter/file_exporter.py +0 -33
  265. aiq/observability/exporter/processing_exporter.py +0 -322
  266. aiq/observability/exporter/raw_exporter.py +0 -52
  267. aiq/observability/exporter/span_exporter.py +0 -265
  268. aiq/observability/exporter_manager.py +0 -335
  269. aiq/observability/mixin/__init__.py +0 -14
  270. aiq/observability/mixin/batch_config_mixin.py +0 -26
  271. aiq/observability/mixin/collector_config_mixin.py +0 -23
  272. aiq/observability/mixin/file_mixin.py +0 -288
  273. aiq/observability/mixin/file_mode.py +0 -23
  274. aiq/observability/mixin/resource_conflict_mixin.py +0 -134
  275. aiq/observability/mixin/serialize_mixin.py +0 -61
  276. aiq/observability/mixin/type_introspection_mixin.py +0 -183
  277. aiq/observability/processor/__init__.py +0 -14
  278. aiq/observability/processor/batching_processor.py +0 -309
  279. aiq/observability/processor/callback_processor.py +0 -42
  280. aiq/observability/processor/intermediate_step_serializer.py +0 -28
  281. aiq/observability/processor/processor.py +0 -71
  282. aiq/observability/register.py +0 -96
  283. aiq/observability/utils/__init__.py +0 -14
  284. aiq/observability/utils/dict_utils.py +0 -236
  285. aiq/observability/utils/time_utils.py +0 -31
  286. aiq/plugins/.namespace +0 -1
  287. aiq/profiler/__init__.py +0 -0
  288. aiq/profiler/calc/__init__.py +0 -14
  289. aiq/profiler/calc/calc_runner.py +0 -627
  290. aiq/profiler/calc/calculations.py +0 -288
  291. aiq/profiler/calc/data_models.py +0 -188
  292. aiq/profiler/calc/plot.py +0 -345
  293. aiq/profiler/callbacks/__init__.py +0 -0
  294. aiq/profiler/callbacks/agno_callback_handler.py +0 -295
  295. aiq/profiler/callbacks/base_callback_class.py +0 -20
  296. aiq/profiler/callbacks/langchain_callback_handler.py +0 -290
  297. aiq/profiler/callbacks/llama_index_callback_handler.py +0 -205
  298. aiq/profiler/callbacks/semantic_kernel_callback_handler.py +0 -238
  299. aiq/profiler/callbacks/token_usage_base_model.py +0 -27
  300. aiq/profiler/data_frame_row.py +0 -51
  301. aiq/profiler/data_models.py +0 -24
  302. aiq/profiler/decorators/__init__.py +0 -0
  303. aiq/profiler/decorators/framework_wrapper.py +0 -131
  304. aiq/profiler/decorators/function_tracking.py +0 -254
  305. aiq/profiler/forecasting/__init__.py +0 -0
  306. aiq/profiler/forecasting/config.py +0 -18
  307. aiq/profiler/forecasting/model_trainer.py +0 -75
  308. aiq/profiler/forecasting/models/__init__.py +0 -22
  309. aiq/profiler/forecasting/models/forecasting_base_model.py +0 -40
  310. aiq/profiler/forecasting/models/linear_model.py +0 -196
  311. aiq/profiler/forecasting/models/random_forest_regressor.py +0 -268
  312. aiq/profiler/inference_metrics_model.py +0 -28
  313. aiq/profiler/inference_optimization/__init__.py +0 -0
  314. aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
  315. aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +0 -460
  316. aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +0 -258
  317. aiq/profiler/inference_optimization/data_models.py +0 -386
  318. aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
  319. aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +0 -468
  320. aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +0 -405
  321. aiq/profiler/inference_optimization/llm_metrics.py +0 -212
  322. aiq/profiler/inference_optimization/prompt_caching.py +0 -163
  323. aiq/profiler/inference_optimization/token_uniqueness.py +0 -107
  324. aiq/profiler/inference_optimization/workflow_runtimes.py +0 -72
  325. aiq/profiler/intermediate_property_adapter.py +0 -102
  326. aiq/profiler/profile_runner.py +0 -473
  327. aiq/profiler/utils.py +0 -184
  328. aiq/registry_handlers/__init__.py +0 -0
  329. aiq/registry_handlers/local/__init__.py +0 -0
  330. aiq/registry_handlers/local/local_handler.py +0 -176
  331. aiq/registry_handlers/local/register_local.py +0 -37
  332. aiq/registry_handlers/metadata_factory.py +0 -60
  333. aiq/registry_handlers/package_utils.py +0 -567
  334. aiq/registry_handlers/pypi/__init__.py +0 -0
  335. aiq/registry_handlers/pypi/pypi_handler.py +0 -251
  336. aiq/registry_handlers/pypi/register_pypi.py +0 -40
  337. aiq/registry_handlers/register.py +0 -21
  338. aiq/registry_handlers/registry_handler_base.py +0 -157
  339. aiq/registry_handlers/rest/__init__.py +0 -0
  340. aiq/registry_handlers/rest/register_rest.py +0 -56
  341. aiq/registry_handlers/rest/rest_handler.py +0 -237
  342. aiq/registry_handlers/schemas/__init__.py +0 -0
  343. aiq/registry_handlers/schemas/headers.py +0 -42
  344. aiq/registry_handlers/schemas/package.py +0 -68
  345. aiq/registry_handlers/schemas/publish.py +0 -63
  346. aiq/registry_handlers/schemas/pull.py +0 -82
  347. aiq/registry_handlers/schemas/remove.py +0 -36
  348. aiq/registry_handlers/schemas/search.py +0 -91
  349. aiq/registry_handlers/schemas/status.py +0 -47
  350. aiq/retriever/__init__.py +0 -0
  351. aiq/retriever/interface.py +0 -37
  352. aiq/retriever/milvus/__init__.py +0 -14
  353. aiq/retriever/milvus/register.py +0 -81
  354. aiq/retriever/milvus/retriever.py +0 -228
  355. aiq/retriever/models.py +0 -74
  356. aiq/retriever/nemo_retriever/__init__.py +0 -14
  357. aiq/retriever/nemo_retriever/register.py +0 -60
  358. aiq/retriever/nemo_retriever/retriever.py +0 -190
  359. aiq/retriever/register.py +0 -22
  360. aiq/runtime/__init__.py +0 -14
  361. aiq/runtime/loader.py +0 -215
  362. aiq/runtime/runner.py +0 -190
  363. aiq/runtime/session.py +0 -158
  364. aiq/runtime/user_metadata.py +0 -130
  365. aiq/settings/__init__.py +0 -0
  366. aiq/settings/global_settings.py +0 -318
  367. aiq/test/.namespace +0 -1
  368. aiq/tool/__init__.py +0 -0
  369. aiq/tool/chat_completion.py +0 -74
  370. aiq/tool/code_execution/README.md +0 -151
  371. aiq/tool/code_execution/__init__.py +0 -0
  372. aiq/tool/code_execution/code_sandbox.py +0 -267
  373. aiq/tool/code_execution/local_sandbox/.gitignore +0 -1
  374. aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +0 -60
  375. aiq/tool/code_execution/local_sandbox/__init__.py +0 -13
  376. aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +0 -198
  377. aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +0 -6
  378. aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +0 -50
  379. aiq/tool/code_execution/register.py +0 -74
  380. aiq/tool/code_execution/test_code_execution_sandbox.py +0 -414
  381. aiq/tool/code_execution/utils.py +0 -100
  382. aiq/tool/datetime_tools.py +0 -42
  383. aiq/tool/document_search.py +0 -141
  384. aiq/tool/github_tools/__init__.py +0 -0
  385. aiq/tool/github_tools/create_github_commit.py +0 -133
  386. aiq/tool/github_tools/create_github_issue.py +0 -87
  387. aiq/tool/github_tools/create_github_pr.py +0 -106
  388. aiq/tool/github_tools/get_github_file.py +0 -106
  389. aiq/tool/github_tools/get_github_issue.py +0 -166
  390. aiq/tool/github_tools/get_github_pr.py +0 -256
  391. aiq/tool/github_tools/update_github_issue.py +0 -100
  392. aiq/tool/mcp/__init__.py +0 -14
  393. aiq/tool/mcp/exceptions.py +0 -142
  394. aiq/tool/mcp/mcp_client.py +0 -255
  395. aiq/tool/mcp/mcp_tool.py +0 -96
  396. aiq/tool/memory_tools/__init__.py +0 -0
  397. aiq/tool/memory_tools/add_memory_tool.py +0 -79
  398. aiq/tool/memory_tools/delete_memory_tool.py +0 -67
  399. aiq/tool/memory_tools/get_memory_tool.py +0 -72
  400. aiq/tool/nvidia_rag.py +0 -95
  401. aiq/tool/register.py +0 -38
  402. aiq/tool/retriever.py +0 -89
  403. aiq/tool/server_tools.py +0 -66
  404. aiq/utils/__init__.py +0 -0
  405. aiq/utils/data_models/__init__.py +0 -0
  406. aiq/utils/data_models/schema_validator.py +0 -58
  407. aiq/utils/debugging_utils.py +0 -43
  408. aiq/utils/dump_distro_mapping.py +0 -32
  409. aiq/utils/exception_handlers/__init__.py +0 -0
  410. aiq/utils/exception_handlers/automatic_retries.py +0 -289
  411. aiq/utils/exception_handlers/mcp.py +0 -211
  412. aiq/utils/exception_handlers/schemas.py +0 -114
  413. aiq/utils/io/__init__.py +0 -0
  414. aiq/utils/io/model_processing.py +0 -28
  415. aiq/utils/io/yaml_tools.py +0 -119
  416. aiq/utils/log_utils.py +0 -37
  417. aiq/utils/metadata_utils.py +0 -74
  418. aiq/utils/optional_imports.py +0 -142
  419. aiq/utils/producer_consumer_queue.py +0 -178
  420. aiq/utils/reactive/__init__.py +0 -0
  421. aiq/utils/reactive/base/__init__.py +0 -0
  422. aiq/utils/reactive/base/observable_base.py +0 -65
  423. aiq/utils/reactive/base/observer_base.py +0 -55
  424. aiq/utils/reactive/base/subject_base.py +0 -79
  425. aiq/utils/reactive/observable.py +0 -59
  426. aiq/utils/reactive/observer.py +0 -76
  427. aiq/utils/reactive/subject.py +0 -131
  428. aiq/utils/reactive/subscription.py +0 -49
  429. aiq/utils/settings/__init__.py +0 -0
  430. aiq/utils/settings/global_settings.py +0 -197
  431. aiq/utils/string_utils.py +0 -38
  432. aiq/utils/type_converter.py +0 -290
  433. aiq/utils/type_utils.py +0 -484
  434. aiq/utils/url_utils.py +0 -27
  435. aiqtoolkit-1.2.0rc4.dist-info/METADATA +0 -363
  436. aiqtoolkit-1.2.0rc4.dist-info/RECORD +0 -438
  437. aiqtoolkit-1.2.0rc4.dist-info/entry_points.txt +0 -20
  438. aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE-3rd-party.txt +0 -3686
  439. aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE.md +0 -201
  440. aiqtoolkit-1.2.0rc4.dist-info/top_level.txt +0 -1
  441. {aiqtoolkit-1.2.0rc4.dist-info → aiqtoolkit-1.2.0rc5.dist-info}/WHEEL +0 -0
aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py
@@ -1,258 +0,0 @@
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
- # SPDX-License-Identifier: Apache-2.0
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- """
- Advanced bottleneck analysis for a dataframe that contains:
-   - event_type in {LLM_START, LLM_END, TOOL_START, TOOL_END, ...}
-   - llm_name
-   - tool_name
-   - UUID
-   - event_timestamp (float or datetime)
-   - other metadata...
-
- We pair start/end events by UUID, compute operation durations,
- then analyze concurrency and produce a summary report.
- """
-
- import numpy as np
- import pandas as pd
-
- from aiq.data_models.intermediate_step import IntermediateStep
- from aiq.profiler.inference_optimization.data_models import SimpleBottleneckReport
- from aiq.profiler.inference_optimization.data_models import SimpleOperationStats
- from aiq.profiler.utils import create_standardized_dataframe
-
-
- # ----------------------------------------------------------------------
- # Main Function
- # ----------------------------------------------------------------------
- def profile_workflow_bottlenecks(all_steps: list[list[IntermediateStep]]) -> SimpleBottleneckReport:
-     """
-     Perform advanced bottleneck profiling on a workflow dataframe.
-
-     1) Pair LLM_START/LLM_END and TOOL_START/TOOL_END by UUID.
-     2) Compute operation durations.
-     3) Analyze concurrency (max concurrent usage).
-     4) Summarize as SimpleOperationStats and produce a final SimpleBottleneckReport.
-
-     Parameters
-     ----------
-     all_steps : Intermediate Steps
-
-     Returns
-     -------
-     SimpleBottleneckReport
-         Contains detailed stats per operation and a textual summary of top bottlenecks.
-     """
-     df = create_standardized_dataframe(all_steps)
-     # -------------------------------------------------------------
-     # 1) Separate events by operation type and match start/end
-     # -------------------------------------------------------------
-     required_cols = {"event_type", "UUID", "event_timestamp"}
-     missing_cols = required_cols - set(df.columns)
-     if missing_cols:
-         raise ValueError(f"DataFrame missing required columns: {missing_cols}")
-
-     # We'll unify LLM and TOOL operations into a single set, with:
-     #   operation_type = 'LLM' or 'TOOL'
-     #   operation_name = llm_name/tool_name
-     #   start_time
-     #   end_time
-     #   duration = end_time - start_time
-     # We'll store them in a list of dicts, then convert to DataFrame.
-     operations_records = []
-
-     # We'll create a copy to avoid mutating user data
-     dfc = df.copy()
-
-     # We define a small helper to map event_type -> (operation_type, which_name_field)
-     def get_operation_info(event_type: str) -> str | None:
-         """
-         Return 'LLM' if event_type starts with 'LLM_', 'TOOL' if event_type starts with 'TOOL_',
-         else None (unknown).
-         """
-         if event_type.startswith("LLM_"):
-             return "LLM"
-         if event_type.startswith("TOOL_"):
-             return "TOOL"
-         return None
-
-     # Group by UUID so we can pair each START with the corresponding END
-     grouped = dfc.groupby("UUID", as_index=False, group_keys=True)
-
-     for uuid_val, group_df in grouped:
-         if len(group_df) < 2:
-             # Possibly incomplete or single event, skip
-             continue
-
-         # We might have multiple events with the same UUID, but typically we expect:
-         #   LLM_START, LLM_END (or TOOL_START, TOOL_END).
-         # Sort by timestamp
-         group_df = group_df.sort_values("event_timestamp")
-
-         # Identify operation_type from the first row's event_type
-         first_event_type = group_df["event_type"].iloc[0]
-         operation_type = get_operation_info(first_event_type)
-         if not operation_type:
-             # unknown or not LLM_/TOOL_
-             continue
-
-         # We'll attempt to find the start row and the end row
-         # Usually there's exactly 1 start, 1 end
-         start_rows = group_df[group_df["event_type"] == f"{operation_type}_START"]
-         end_rows = group_df[group_df["event_type"] == f"{operation_type}_END"]
-
-         if len(start_rows) == 0 or len(end_rows) == 0:
-             # No matching start/end
-             continue
-
-         # We'll just take the earliest start and the latest end for the entire group.
-         start_time = start_rows["event_timestamp"].min()
-         end_time = end_rows["event_timestamp"].max()
-         duration = end_time - start_time
-
-         # For the name, we pick 'llm_name' or 'tool_name' depending on operation_type
-         if operation_type == "LLM":
-             # Among the rows, pick a non-null llm_name if present
-             op_names = group_df["llm_name"].dropna().unique()
-             # fallback to a default if none
-             operation_name = op_names[0] if len(op_names) else "unknown_llm"
-         else:
-             op_names = group_df["tool_name"].dropna().unique()
-             operation_name = op_names[0] if len(op_names) else "unknown_tool"
-
-         operations_records.append({
-             "operation_type": operation_type,
-             "operation_name": operation_name,
-             "start_time": start_time,
-             "end_time": end_time,
-             "duration": duration,
-             "UUID": uuid_val
-         })
-
-     if not operations_records:
-         # No valid operations found
-         return SimpleBottleneckReport(stats={}, summary="No operations found to profile.")
-
-     operations_df = pd.DataFrame(operations_records)
-
-     # -------------------------------------------------------------
-     # 2) Concurrency Analysis
-     # -------------------------------------------------------------
-     # We want to find the maximum concurrency for each operation_name.
-     # We'll do a timeline-based approach: for each operation we have a start_time, end_time
-     # We'll create +1 event at start_time, -1 event at end_time, then do a running sum.
-     # Then we can measure concurrency across the entire timeline. However, we want concurrency
-     # specifically *by operation_name* as well as overall.
-     #
-     # We'll do it in two passes:
-     #   A) Overall concurrency ignoring operation_name
-     #   B) concurrency per (operation_type, operation_name)
-     # Then we can combine them for a "peak concurrency" measure.
-
-     # A) Overall concurrency (not always essential, but might be interesting)
-     timeline_events = []
-     for row in operations_df.itertuples(index=False):
-         timeline_events.append((row.start_time, +1))
-         timeline_events.append((row.end_time, -1))
-
-     timeline_events.sort(key=lambda x: x[0])  # sort by time
-     current_concurrency = 0
-     concurrency_trace = []
-     for ts, delta in timeline_events:
-         current_concurrency += delta
-         concurrency_trace.append((ts, current_concurrency))
-     overall_max_concurrency = max(c[1] for c in concurrency_trace) if concurrency_trace else 0
-
-     # B) concurrency by operation_name
-     # We'll generate timeline events per operation_name
-     # Then compute the max concurrency for that subset
-     operation_names = operations_df["operation_name"].unique()
-     max_concurrency_by_name = {}
-
-     for op_name in operation_names:
-         sub = operations_df[operations_df["operation_name"] == op_name]
-         events_sub = []
-         for row in sub.itertuples(index=False):
-             events_sub.append((row.start_time, +1))
-             events_sub.append((row.end_time, -1))
-         if not events_sub:
-             max_concurrency_by_name[op_name] = 0
-             continue
-         events_sub.sort(key=lambda x: x[0])
-         c_curr = 0
-         c_max = 0
-         for ts, delta in events_sub:
-             c_curr += delta
-             if c_curr > c_max:  # pylint: disable=consider-using-max-builtin
-                 c_max = c_curr
-         max_concurrency_by_name[op_name] = c_max
-
-     # -------------------------------------------------------------
-     # 3) Compute summary stats per (operation_type, operation_name)
-     # -------------------------------------------------------------
-     # We'll gather durations in a list, compute average, p95, p99, etc.
-
-     stats_dict = {}
-     grouped_ops = operations_df.groupby(["operation_type", "operation_name"])
-     for (op_type, op_name), grp in grouped_ops:
-         durations = grp["duration"].values
-         usage_count = len(durations)
-         avg_duration = durations.mean()
-         p95_duration = np.percentile(durations, 95)
-         p99_duration = np.percentile(durations, 99)
-
-         # concurrency
-         max_concur = max_concurrency_by_name.get(op_name, 0)
-
-         # define a custom "bottleneck_score":
-         #   We say score = avg_duration * max_concurrency,
-         bottleneck_score = float(avg_duration * max_concur)
-
-         # store in dictionary
-         key = f"{op_type}:{op_name}"
-         stats_dict[key] = SimpleOperationStats(operation_type=op_type,
-                                                operation_name=op_name,
-                                                usage_count=usage_count,
-                                                avg_duration=float(avg_duration),
-                                                p95_duration=float(p95_duration),
-                                                p99_duration=float(p99_duration),
-                                                max_concurrency=int(max_concur),
-                                                bottleneck_score=bottleneck_score)
-
-     # -------------------------------------------------------------
-     # 4) Produce a textual summary highlighting top bottlenecks
-     # -------------------------------------------------------------
-     # We'll rank by bottleneck_score descending and show top 3.
-     if not stats_dict:
-         return SimpleBottleneckReport(stats={}, summary="No stats to report.")
-
-     top_items = sorted(stats_dict.values(), key=lambda x: x.bottleneck_score, reverse=True)
-     top_3 = top_items[:3]
-
-     # Build a simple textual summary
-     lines = []
-     lines.append("---- BOTTLENECK REPORT ----")
-     lines.append(f"Total distinct operations found: {len(stats_dict)}")
-     lines.append(f"Overall max concurrency (all ops): {overall_max_concurrency}")
-     lines.append("Top 3 Bottlenecks by bottleneck_score (avg_duration * max_concurrency):")
-     for i, item in enumerate(top_3, start=1):
-         lines.append(f"{i}) {item.operation_type} '{item.operation_name}': "
-                      f"score={item.bottleneck_score:.2f}, "
-                      f"avg_dur={item.avg_duration:.2f}, "
-                      f"max_concurrency={item.max_concurrency}")
-     summary_report = "\n".join(lines)
-
-     # Construct a final Pydantic model
-     return SimpleBottleneckReport(stats=stats_dict, summary=summary_report)
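Note: the removed simple_stack_analysis module computes peak concurrency with a sweep over +1/-1 interval events, as described in its "Concurrency Analysis" comments. The short Python sketch below is illustrative only and not part of the diff; the interval values are made up.

intervals = [(0.0, 2.0), (1.0, 3.0), (2.5, 4.0)]  # hypothetical (start_time, end_time) pairs

events = []
for start, end in intervals:
    events.append((start, +1))   # an operation begins
    events.append((end, -1))     # an operation ends

events.sort(key=lambda x: x[0])  # process events in time order

current = 0
peak = 0
for _ts, delta in events:
    current += delta             # running count of operations in flight
    peak = max(peak, current)

print(peak)  # 2: the (0.0, 2.0) and (1.0, 3.0) intervals overlap

Sorting the events and keeping a running sum yields the maximum number of operations in flight at any instant, which is the max_concurrency figure that feeds the bottleneck_score (avg_duration * max_concurrency) above.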
aiq/profiler/inference_optimization/data_models.py
@@ -1,386 +0,0 @@
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
- # SPDX-License-Identifier: Apache-2.0
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
-
- from typing import Any
-
- from pydantic import BaseModel
- from pydantic import ConfigDict
- from pydantic import Field
- from pydantic import RootModel
-
- # -----------------------------------------------------------
- # Prompt Caching Data Models
- # -----------------------------------------------------------
-
-
- class PrefixInfo(BaseModel):
-     """
-     Stores metadata about a particular prefix observed in the LLM text input.
-     """
-     prefix: str
-     prefix_length: int
-     calls_count: int
-     calls_percentage: float = Field(..., ge=0.0, le=1.0)
-
-
- class FrameworkLLMPrefixData(BaseModel):
-     """
-     Metadata for a single (framework, llm_name) group,
-     including total calls and all prefix statistics.
-     """
-     total_calls: int
-     prefix_info: list[PrefixInfo]
-
-
- class CommonPrefixesOutput(RootModel[dict[str, FrameworkLLMPrefixData]]):
-     """
-     A root model storing a dictionary keyed by '<framework>-<llm>',
-     each value is a FrameworkLLMPrefixData instance.
-     """
-
-     def to_dict(self) -> dict[str, FrameworkLLMPrefixData]:
-         """
-         Return the raw dictionary of data, discarding the 'root' wrapper.
-         """
-         return self.root
-
-
- # ----------------------------------------------------------------
- # Token Uniqueness Models
- # ----------------------------------------------------------------
-
-
- class LLMUniquenessMetrics(BaseModel):
-     """
-     Stores p90, p95, and p99 for the 'new words' metric.
-     """
-     p90: float
-     p95: float
-     p99: float
-
-
- class LLMUniquenessMetricsByLLM(RootModel[dict[str, LLMUniquenessMetrics]]):
-     """
-     A RootModel containing a dictionary where each key is an LLM name
-     and each value is the LLMUniquenessMetrics for that LLM.
-     """
-
-     def to_dict(self) -> dict[str, Any]:
-         # Return the raw dictionary for convenience
-         return self.root
-
-
- # ----------------------------------------------------------------
- # Workflow Runtime Models
- # ----------------------------------------------------------------
-
-
- class WorkflowRuntimeMetrics(BaseModel):
-     """
-     Stores p90, p95, and p99 for workflow runtimes across all examples.
-     """
-     p90: float
-     p95: float
-     p99: float
-
-
- # ----------------------------------------------------------------------
- # Simple Bottleneck Detection Models
- # ----------------------------------------------------------------------
-
-
- class SimpleOperationStats(BaseModel):
-     """
-     Statistics for a particular operation name (LLM or tool),
-     capturing concurrency, duration, usage, etc.
-     """
-     operation_type: str  # 'LLM' or 'TOOL'
-     operation_name: str  # e.g., "llama-3" or "serpapi"
-     usage_count: int  # how many times it appears
-     avg_duration: float  # average duration
-     p95_duration: float
-     p99_duration: float
-     max_concurrency: int  # maximum number of concurrent operations
-     bottleneck_score: float = Field(..., description="Custom metric to rank bottlenecks.")
-
-
- class SimpleBottleneckReport(BaseModel):
-     """
-     A container for all operation stats keyed by 'operation_type:operation_name',
-     plus a textual summary that highlights top bottlenecks.
-     """
-     stats: dict[str, SimpleOperationStats]
-     summary: str
-
-
- # ----------------------------------------------------------------------
- # Nested Bottleneck Models
- # ----------------------------------------------------------------------
-
-
- class CallNode(BaseModel):
-     """
-     A single call (LLM or TOOL) in a nested call tree.
-
-     Attributes
-     ----------
-     uuid: str
-         Unique ID tying together START/END events.
-     operation_type: str
-         e.g. 'LLM' or 'TOOL'.
-     operation_name: str
-         e.g. 'llama-3', 'bing-search', ...
-     start_time: float
-         Time when the call started.
-     end_time: float
-         Time when the call ended.
-     duration: float
-         end_time - start_time
-     children: list["CallNode"]
-         List of nested calls inside this call's time window.
-     parent: "CallNode" | None
-         Reference to the parent call in the tree (None if top-level).
-     """
-     model_config = ConfigDict(arbitrary_types_allowed=True)
-
-     uuid: str
-     operation_type: str
-     operation_name: str
-     start_time: float
-     end_time: float
-     duration: float = Field(..., description="end_time - start_time")
-     children: list["CallNode"] = Field(default_factory=list)
-     parent: "CallNode | None" = None
-
-     def compute_self_time(self) -> float:
-         """
-         'Self time' = duration minus the union of child intervals.
-         Overlapping child intervals are merged so we don't double-count them.
-         """
-         if not self.children:
-             return self.duration
-
-         intervals = [(c.start_time, c.end_time) for c in self.children]  # pylint: disable=not-an-iterable
-         # Sort by start time
-         intervals.sort(key=lambda x: x[0])
-
-         merged = []
-         cur_start, cur_end = intervals[0]
-         for i in range(1, len(intervals)):
-             s, e = intervals[i]
-             if s <= cur_end:
-                 # Overlap
-                 cur_end = max(cur_end, e)
-             else:
-                 merged.append((cur_start, cur_end))
-                 cur_start, cur_end = s, e
-         merged.append((cur_start, cur_end))
-
-         # Sum coverage, clamped to [start_time, end_time]
-         covered = 0.0
-         for (s, e) in merged:
-             s_clamped = max(s, self.start_time)
-             e_clamped = min(e, self.end_time)
-             if e_clamped > s_clamped:
-                 covered += (e_clamped - s_clamped)
-
-         return max(0.0, self.duration - covered)
-
-     def compute_subtree_time(self) -> float:
-         """
-         Recursively compute the sum of self_time + children's subtree_time.
-         This ensures no overlap double-counting among children.
-         """
-         total = self.compute_self_time()
-         for c in self.children:  # pylint: disable=not-an-iterable
-             total += c.compute_subtree_time()
-         return total
-
-     def __str__(self) -> str:
-         return self._repr(0)
-
-     def _repr(self, level: int) -> str:
-         indent = " " * level
-         info = (f"{indent}- {self.operation_type} '{self.operation_name}' "
-                 f"(uuid={self.uuid}, start={self.start_time:.2f}, "
-                 f"end={self.end_time:.2f}, dur={self.duration:.2f})")
-         child_strs = [child._repr(level + 1) for child in self.children]  # pylint: disable=not-an-iterable
-         return "\n".join([info] + child_strs)
-
-
- CallNode.model_rebuild()
-
-
- class NodeMetrics(BaseModel):
-     """
-     Metrics for a single node:
-       - self_time
-       - subtree_time
-       - concurrency_midpoint (optional)
-       - bottleneck_score (example: subtree_time)
-     """
-     uuid: str
-     operation_type: str
-     operation_name: str
-     start_time: float
-     end_time: float
-     duration: float
-     self_time: float
-     subtree_time: float
-     concurrency_midpoint: float | None = None
-     bottleneck_score: float
-
-
- class ConcurrencyDistribution(BaseModel):
-     """
-     Overall concurrency distribution info:
-       - timeline_segments: List of (start, end, concurrency)
-       - p50, p90, p95, p99 concurrency
-     """
-     timeline_segments: list[tuple[float, float, int]]
-     p50: float
-     p90: float
-     p95: float
-     p99: float
-
-
- class NestedCallProfilingResult(BaseModel):
-     """
-     The final Pydantic model returned by 'multi_example_call_profiling'.
-
-     Contains:
-       - concurrency: ConcurrencyDistribution
-       - node_metrics: dict[uuid, NodeMetrics]
-       - top_bottlenecks: The top calls by bottleneck_score
-       - textual_report: A multiline string summarizing everything
-     """
-     concurrency: ConcurrencyDistribution
-     node_metrics: dict[str, NodeMetrics]
-     top_bottlenecks: list[NodeMetrics]
-     textual_report: str
-
-
- # ----------------------------------------------------------------------
- # Concurrency Spike Analysis Models
- # ----------------------------------------------------------------------
-
-
- class ConcurrencyCallNode(CallNode):
-     """
-     A single call in the nested call tree for one example.
-     Each call is matched by a UUID with a `*_START` and `*_END` event.
-
-     Because fields like prompt_tokens, completion_tokens, total_tokens
-     may only exist at the END event, we store them only after seeing `*_END`".
-     """
-
-     example_number: int
-
-     # Additional fields from END events
-     prompt_tokens: int | None = None
-     completion_tokens: int | None = None
-     total_tokens: int | None = None
-     tool_outputs: str | None = None
-     llm_text_output: str | None = None
-
-
- ConcurrencyCallNode.model_rebuild()
-
-
- class ConcurrencySpikeInfo(BaseModel):
-     """
-     Info about one concurrency spike interval:
-       - start, end of the spike
-       - concurrency level
-       - list of calls that overlap
-     """
-     start_time: float
-     end_time: float
-     concurrency: int
-     active_uuids: list[str] = Field(default_factory=list)
-
-
- class ConcurrencyCorrelationStats(BaseModel):
-     """
-     Simple container for correlation / summarized stats of calls overlapping concurrency spikes.
-     """
-     avg_prompt_tokens: float
-     avg_total_tokens: float
-
-
- class ConcurrencyAnalysisResult(BaseModel):
-     """
-     The final Pydantic model returned by concurrency_spike_analysis(...).
-     Contains:
-       - concurrency_distribution: concurrency_level => total_time
-       - p50_concurrency, p90_concurrency, p95_concurrency, p99_concurrency
-       - spike_threshold, spike_intervals
-       - correlation_stats
-       - textual_report
-     """
-     concurrency_distribution: dict[int, float]
-     p50_concurrency: float
-     p90_concurrency: float
-     p95_concurrency: float
-     p99_concurrency: float
-
-     spike_threshold: int
-     spike_intervals: list[ConcurrencySpikeInfo]
-     correlation_stats: ConcurrencyCorrelationStats
-
-     average_latency_by_concurrency: dict[int, float]
-
-     textual_report: str
-
-
- # ----------------------------------------------------------------------
- # PrefixSpan Analysis Models
- # ----------------------------------------------------------------------
-
-
- class PrefixCallNode(BaseModel):
-     """
-     Represents a single call in an example's workflow.
-     - For LLM calls, we also store llm_text_input if available so we can incorporate it into the token.
-     """
-     uuid: str
-     example_number: int
-     operation_type: str  # "LLM" or "TOOL"
-     operation_name: str  # e.g. "llama-3", "internet-search"
-     start_time: float
-     end_time: float
-     duration: float
-     llm_text_input: str | None = None
-
-
- class FrequentPattern(BaseModel):
-     """
-     Frequent sub-sequence discovered by PrefixSpan, with coverage and average duration data.
-     """
-     pattern: list[str]  # e.g. ["LLM:llama-3|Hello world", "TOOL:internet-search"]
-     frequency: int  # total occurrences across all examples
-     coverage: float  # fraction of distinct examples that contain this pattern
-     average_duration: float  # average sum of call durations for calls in that sub-sequence
-     examples_containing: list[int]  # which examples have at least one occurrence
-
-
- class PrefixSpanSubworkflowResult(BaseModel):
-     """
-     Pydantic model for the final outcome:
-       - A list of frequent patterns
-       - A textual summary
-     """
-     patterns: list[FrequentPattern]
-     textual_report: str
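For reference, the interval-merging idea behind CallNode.compute_self_time in the removed data_models module can be reproduced in a few lines. The self_time helper below is a hypothetical standalone sketch (no pydantic, no aiq imports) and the timing values are invented; it is not part of the diff.

# Standalone sketch of the "self time" idea: parent duration minus the merged
# union of child intervals, clamped to the parent's own time window.
def self_time(start: float, end: float, children: list[tuple[float, float]]) -> float:
    if not children:
        return end - start
    intervals = sorted(children)              # sort child (start, end) pairs by start
    merged = [list(intervals[0])]
    for s, e in intervals[1:]:
        if s <= merged[-1][1]:                # overlaps the previous interval -> extend it
            merged[-1][1] = max(merged[-1][1], e)
        else:
            merged.append([s, e])
    covered = sum(min(e, end) - max(s, start)  # clamp each merged interval to the parent
                  for s, e in merged if min(e, end) > max(s, start))
    return max(0.0, (end - start) - covered)

# A parent call from t=0 to t=10 with two overlapping children (2-5 and 4-7):
# the children cover 5 seconds once merged, so self time is 10 - 5 = 5.
print(self_time(0.0, 10.0, [(2.0, 5.0), (4.0, 7.0)]))  # 5.0

Merging overlapping child intervals before subtracting avoids double-counting, which is why compute_subtree_time can sum self times recursively without overlap errors.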